6 * Copyright (c) 1999-2003 The SquirrelMail Project Team
7 * Licensed under the GNU GPL. For full terms see the file COPYING.
9 * This file contains variuos functions that are needed to do
10 * internationalization of SquirrelMail.
12 * Internally the output character set is used. Other characters are
13 * encoded using Unicode entities according to HTML 4.0.
18 require_once(SM_PATH
. 'functions/global.php');
20 /* Decodes a string to the internal encoding from the given charset */
21 function charset_decode ($charset, $string) {
22 global $languages, $squirrelmail_language;
24 if (isset($languages[$squirrelmail_language]['XTRA_CODE']) &&
25 function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) {
26 $string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string);
29 /* All HTML special characters are 7 bit and can be replaced first */
31 $string = htmlspecialchars ($string);
33 $charset = strtolower($charset);
37 if (ereg('iso-8859-([[:digit:]]+)', $charset, $res)) {
39 $ret = charset_decode_iso_8859_1 ($string);
40 } else if ($res[1] == '2') {
41 $ret = charset_decode_iso_8859_2 ($string);
42 } else if ($res[1] == '4') {
43 $ret = charset_decode_iso_8859_4 ($string);
44 } else if ($res[1] == '5') {
45 $ret = charset_decode_iso_8859_5 ($string);
46 } else if ($res[1] == '7') {
47 $ret = charset_decode_iso_8859_7 ($string);
48 } else if ($res[1] == '9') {
49 $ret = charset_decode_iso_8859_9 ($string);
50 } else if ($res[1] == '13') {
51 $ret = charset_decode_iso_8859_13 ($string);
52 } else if ($res[1] == '15') {
53 $ret = charset_decode_iso_8859_15 ($string);
55 $ret = charset_decode_iso_8859_default ($string);
57 } else if ($charset == 'ns_4551-1') {
58 $ret = charset_decode_ns_4551_1 ($string);
59 } else if ($charset == 'koi8-r') {
60 $ret = charset_decode_koi8r ($string);
61 } else if ($charset == 'koi8-u') {
62 $ret = charset_decode_koi8u ($string);
63 } else if ($charset == 'windows-1251') {
64 $ret = charset_decode_windows_1251 ($string);
65 } else if ($charset == 'windows-1253') {
66 $ret = charset_decode_windows_1253 ($string);
67 } else if ($charset == 'windows-1254') {
68 $ret = charset_decode_windows_1254 ($string);
69 } else if ($charset == 'windows-1257') {
70 $ret = charset_decode_windows_1257 ($string);
71 } else if ($charset == 'utf-8') {
72 $ret = charset_decode_utf8 ($string);
80 iso-8859-1 is the same as Latin 1 and is normally used
83 function charset_decode_iso_8859_1 ($string) {
84 global $default_charset;
86 if (strtolower($default_charset) <> 'iso-8859-1') {
87 /* Only do the slow convert if there are 8-bit characters */
88 if (ereg("[\200-\377]", $string)) {
89 $string = str_replace("\201", '', $string);
90 $string = str_replace("\202", '‚', $string);
91 $string = str_replace("\203", 'ƒ', $string);
92 $string = str_replace("\204", '„', $string);
93 $string = str_replace("\205", '…', $string);
94 $string = str_replace("\206", '†', $string);
95 $string = str_replace("\207", '‡', $string);
96 $string = str_replace("\210", 'ˆ', $string);
97 $string = str_replace("\211", '‰', $string);
98 $string = str_replace("\212", 'Š', $string);
99 $string = str_replace("\213", '‹', $string);
100 $string = str_replace("\214", 'Œ', $string);
101 $string = str_replace("\215", '', $string);
102 $string = str_replace("\216", 'Ž', $string);
103 $string = str_replace("\217", '', $string);
104 $string = str_replace("\220", '', $string);
105 $string = str_replace("\221", '‘', $string);
106 $string = str_replace("\222", '’', $string);
107 $string = str_replace("\223", '“', $string);
108 $string = str_replace("\224", '”', $string);
109 $string = str_replace("\225", '•', $string);
110 $string = str_replace("\226", '–', $string);
111 $string = str_replace("\227", '—', $string);
112 $string = str_replace("\230", '˜', $string);
113 $string = str_replace("\231", '™', $string);
114 $string = str_replace("\232", 'š', $string);
115 $string = str_replace("\233", '›', $string);
116 $string = str_replace("\234", 'œ', $string);
117 $string = str_replace("\235", '', $string);
118 $string = str_replace("\236", 'ž', $string);
119 $string = str_replace("\237", 'Ÿ', $string);
120 $string = str_replace("\240", ' ', $string);
121 $string = str_replace("\241", '¡', $string);
122 $string = str_replace("\242", '¢', $string);
123 $string = str_replace("\243", '£', $string);
124 $string = str_replace("\244", '¤', $string);
125 $string = str_replace("\245", '¥', $string);
126 $string = str_replace("\246", '¦', $string);
127 $string = str_replace("\247", '§', $string);
128 $string = str_replace("\250", '¨', $string);
129 $string = str_replace("\251", '©', $string);
130 $string = str_replace("\252", 'ª', $string);
131 $string = str_replace("\253", '«', $string);
132 $string = str_replace("\254", '¬', $string);
133 $string = str_replace("\255", '­', $string);
134 $string = str_replace("\256", '®', $string);
135 $string = str_replace("\257", '¯', $string);
136 $string = str_replace("\260", '°', $string);
137 $string = str_replace("\261", '±', $string);
138 $string = str_replace("\262", '²', $string);
139 $string = str_replace("\263", '³', $string);
140 $string = str_replace("\264", '´', $string);
141 $string = str_replace("\265", 'µ', $string);
142 $string = str_replace("\266", '¶', $string);
143 $string = str_replace("\267", '·', $string);
144 $string = str_replace("\270", '¸', $string);
145 $string = str_replace("\271", '¹', $string);
146 $string = str_replace("\272", 'º', $string);
147 $string = str_replace("\273", '»', $string);
148 $string = str_replace("\274", '¼', $string);
149 $string = str_replace("\275", '½', $string);
150 $string = str_replace("\276", '¾', $string);
151 $string = str_replace("\277", '¿', $string);
152 $string = str_replace("\300", 'À', $string);
153 $string = str_replace("\301", 'Á', $string);
154 $string = str_replace("\302", 'Â', $string);
155 $string = str_replace("\303", 'Ã', $string);
156 $string = str_replace("\304", 'Ä', $string);
157 $string = str_replace("\305", 'Å', $string);
158 $string = str_replace("\306", 'Æ', $string);
159 $string = str_replace("\307", 'Ç', $string);
160 $string = str_replace("\310", 'È', $string);
161 $string = str_replace("\311", 'É', $string);
162 $string = str_replace("\312", 'Ê', $string);
163 $string = str_replace("\313", 'Ë', $string);
164 $string = str_replace("\314", 'Ì', $string);
165 $string = str_replace("\315", 'Í', $string);
166 $string = str_replace("\316", 'Î', $string);
167 $string = str_replace("\317", 'Ï', $string);
168 $string = str_replace("\320", 'Ð', $string);
169 $string = str_replace("\321", 'Ñ', $string);
170 $string = str_replace("\322", 'Ò', $string);
171 $string = str_replace("\323", 'Ó', $string);
172 $string = str_replace("\324", 'Ô', $string);
173 $string = str_replace("\325", 'Õ', $string);
174 $string = str_replace("\326", 'Ö', $string);
175 $string = str_replace("\327", '×', $string);
176 $string = str_replace("\330", 'Ø', $string);
177 $string = str_replace("\331", 'Ù', $string);
178 $string = str_replace("\332", 'Ú', $string);
179 $string = str_replace("\333", 'Û', $string);
180 $string = str_replace("\334", 'Ü', $string);
181 $string = str_replace("\335", 'Ý', $string);
182 $string = str_replace("\336", 'Þ', $string);
183 $string = str_replace("\337", 'ß', $string);
184 $string = str_replace("\340", 'à', $string);
185 $string = str_replace("\341", 'á', $string);
186 $string = str_replace("\342", 'â', $string);
187 $string = str_replace("\343", 'ã', $string);
188 $string = str_replace("\344", 'ä', $string);
189 $string = str_replace("\345", 'å', $string);
190 $string = str_replace("\346", 'æ', $string);
191 $string = str_replace("\347", 'ç', $string);
192 $string = str_replace("\350", 'è', $string);
193 $string = str_replace("\351", 'é', $string);
194 $string = str_replace("\352", 'ê', $string);
195 $string = str_replace("\353", 'ë', $string);
196 $string = str_replace("\354", 'ì', $string);
197 $string = str_replace("\355", 'í', $string);
198 $string = str_replace("\356", 'î', $string);
199 $string = str_replace("\357", 'ï', $string);
200 $string = str_replace("\360", 'ð', $string);
201 $string = str_replace("\361", 'ñ', $string);
202 $string = str_replace("\362", 'ò', $string);
203 $string = str_replace("\363", 'ó', $string);
204 $string = str_replace("\364", 'ô', $string);
205 $string = str_replace("\365", 'õ', $string);
206 $string = str_replace("\366", 'ö', $string);
207 $string = str_replace("\367", '÷', $string);
208 $string = str_replace("\370", 'ø', $string);
209 $string = str_replace("\371", 'ù', $string);
210 $string = str_replace("\372", 'ú', $string);
211 $string = str_replace("\373", 'û', $string);
212 $string = str_replace("\374", 'ü', $string);
213 $string = str_replace("\375", 'ý', $string);
214 $string = str_replace("\376", 'þ', $string);
215 $string = str_replace("\377", 'ÿ', $string);
222 /* iso-8859-2 is used for some eastern European languages */
223 function charset_decode_iso_8859_2 ($string) {
224 global $default_charset;
226 if (strtolower($default_charset) == 'iso-8859-2')
229 /* Only do the slow convert if there are 8-bit characters */
230 if (! ereg("[\200-\377]", $string))
234 $string = str_replace("\240", ' ', $string);
235 /* LATIN CAPITAL LETTER A WITH OGONEK */
236 $string = str_replace("\241", 'Ą', $string);
238 $string = str_replace("\242", '˘', $string);
239 // LATIN CAPITAL LETTER L WITH STROKE
240 $string = str_replace("\243", 'Ł', $string);
242 $string = str_replace("\244", '¤', $string);
243 // LATIN CAPITAL LETTER L WITH CARON
244 $string = str_replace("\245", 'Ľ', $string);
245 // LATIN CAPITAL LETTER S WITH ACUTE
246 $string = str_replace("\246", 'Ś', $string);
248 $string = str_replace("\247", '§', $string);
250 $string = str_replace("\250", '¨', $string);
251 // LATIN CAPITAL LETTER S WITH CARON
252 $string = str_replace("\251", 'Š', $string);
253 // LATIN CAPITAL LETTER S WITH CEDILLA
254 $string = str_replace("\252", 'Ş', $string);
255 // LATIN CAPITAL LETTER T WITH CARON
256 $string = str_replace("\253", 'Ť', $string);
257 // LATIN CAPITAL LETTER Z WITH ACUTE
258 $string = str_replace("\254", 'Ź', $string);
260 $string = str_replace("\255", '­', $string);
261 // LATIN CAPITAL LETTER Z WITH CARON
262 $string = str_replace("\256", 'Ž', $string);
263 // LATIN CAPITAL LETTER Z WITH DOT ABOVE
264 $string = str_replace("\257", 'Ż', $string);
266 $string = str_replace("\260", '°', $string);
267 // LATIN SMALL LETTER A WITH OGONEK
268 $string = str_replace("\261", 'ą', $string);
270 $string = str_replace("\262", '˛', $string);
271 // LATIN SMALL LETTER L WITH STROKE
272 $string = str_replace("\263", 'ł', $string);
274 $string = str_replace("\264", '´', $string);
275 // LATIN SMALL LETTER L WITH CARON
276 $string = str_replace("\265", 'ľ', $string);
277 // LATIN SMALL LETTER S WITH ACUTE
278 $string = str_replace("\266", 'ś', $string);
280 $string = str_replace("\267", 'ˇ', $string);
282 $string = str_replace("\270", '¸', $string);
283 // LATIN SMALL LETTER S WITH CARON
284 $string = str_replace("\271", 'š', $string);
285 // LATIN SMALL LETTER S WITH CEDILLA
286 $string = str_replace("\272", 'ş', $string);
287 // LATIN SMALL LETTER T WITH CARON
288 $string = str_replace("\273", 'ť', $string);
289 // LATIN SMALL LETTER Z WITH ACUTE
290 $string = str_replace("\274", 'ź', $string);
291 // DOUBLE ACUTE ACCENT
292 $string = str_replace("\275", '˝', $string);
293 // LATIN SMALL LETTER Z WITH CARON
294 $string = str_replace("\276", 'ž', $string);
295 // LATIN SMALL LETTER Z WITH DOT ABOVE
296 $string = str_replace("\277", 'ż', $string);
297 // LATIN CAPITAL LETTER R WITH ACUTE
298 $string = str_replace("\300", 'Ŕ', $string);
299 // LATIN CAPITAL LETTER A WITH ACUTE
300 $string = str_replace("\301", 'Á', $string);
301 // LATIN CAPITAL LETTER A WITH CIRCUMFLEX
302 $string = str_replace("\302", 'Â', $string);
303 // LATIN CAPITAL LETTER A WITH BREVE
304 $string = str_replace("\303", 'Ă', $string);
305 // LATIN CAPITAL LETTER A WITH DIAERESIS
306 $string = str_replace("\304", 'Ä', $string);
307 // LATIN CAPITAL LETTER L WITH ACUTE
308 $string = str_replace("\305", 'Ĺ', $string);
309 // LATIN CAPITAL LETTER C WITH ACUTE
310 $string = str_replace("\306", 'Ć', $string);
311 // LATIN CAPITAL LETTER C WITH CEDILLA
312 $string = str_replace("\307", 'Ç', $string);
313 // LATIN CAPITAL LETTER C WITH CARON
314 $string = str_replace("\310", 'Č', $string);
315 // LATIN CAPITAL LETTER E WITH ACUTE
316 $string = str_replace("\311", 'É', $string);
317 // LATIN CAPITAL LETTER E WITH OGONEK
318 $string = str_replace("\312", 'Ę', $string);
319 // LATIN CAPITAL LETTER E WITH DIAERESIS
320 $string = str_replace("\313", 'Ë', $string);
321 // LATIN CAPITAL LETTER E WITH CARON
322 $string = str_replace("\314", 'Ě', $string);
323 // LATIN CAPITAL LETTER I WITH ACUTE
324 $string = str_replace("\315", 'Í', $string);
325 // LATIN CAPITAL LETTER I WITH CIRCUMFLEX
326 $string = str_replace("\316", 'Î', $string);
327 // LATIN CAPITAL LETTER D WITH CARON
328 $string = str_replace("\317", 'Ď', $string);
329 // LATIN CAPITAL LETTER D WITH STROKE
330 $string = str_replace("\320", 'Đ', $string);
331 // LATIN CAPITAL LETTER N WITH ACUTE
332 $string = str_replace("\321", 'Ń', $string);
333 // LATIN CAPITAL LETTER N WITH CARON
334 $string = str_replace("\322", 'Ň', $string);
335 // LATIN CAPITAL LETTER O WITH ACUTE
336 $string = str_replace("\323", 'Ó', $string);
337 // LATIN CAPITAL LETTER O WITH CIRCUMFLEX
338 $string = str_replace("\324", 'Ô', $string);
339 // LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
340 $string = str_replace("\325", 'Ő', $string);
341 // LATIN CAPITAL LETTER O WITH DIAERESIS
342 $string = str_replace("\326", 'Ö', $string);
343 // MULTIPLICATION SIGN
344 $string = str_replace("\327", '×', $string);
345 // LATIN CAPITAL LETTER R WITH CARON
346 $string = str_replace("\330", 'Ř', $string);
347 // LATIN CAPITAL LETTER U WITH RING ABOVE
348 $string = str_replace("\331", 'Ů', $string);
349 // LATIN CAPITAL LETTER U WITH ACUTE
350 $string = str_replace("\332", 'Ú', $string);
351 // LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
352 $string = str_replace("\333", 'Ű', $string);
353 // LATIN CAPITAL LETTER U WITH DIAERESIS
354 $string = str_replace("\334", 'Ü', $string);
355 // LATIN CAPITAL LETTER Y WITH ACUTE
356 $string = str_replace("\335", 'Ý', $string);
357 // LATIN CAPITAL LETTER T WITH CEDILLA
358 $string = str_replace("\336", 'Ţ', $string);
359 // LATIN SMALL LETTER SHARP S
360 $string = str_replace("\337", 'ß', $string);
361 // LATIN SMALL LETTER R WITH ACUTE
362 $string = str_replace("\340", 'ŕ', $string);
363 // LATIN SMALL LETTER A WITH ACUTE
364 $string = str_replace("\341", 'á', $string);
365 // LATIN SMALL LETTER A WITH CIRCUMFLEX
366 $string = str_replace("\342", 'â', $string);
367 // LATIN SMALL LETTER A WITH BREVE
368 $string = str_replace("\343", 'ă', $string);
369 // LATIN SMALL LETTER A WITH DIAERESIS
370 $string = str_replace("\344", 'ä', $string);
371 // LATIN SMALL LETTER L WITH ACUTE
372 $string = str_replace("\345", 'ĺ', $string);
373 // LATIN SMALL LETTER C WITH ACUTE
374 $string = str_replace("\346", 'ć', $string);
375 // LATIN SMALL LETTER C WITH CEDILLA
376 $string = str_replace("\347", 'ç', $string);
377 // LATIN SMALL LETTER C WITH CARON
378 $string = str_replace("\350", 'č', $string);
379 // LATIN SMALL LETTER E WITH ACUTE
380 $string = str_replace("\351", 'é', $string);
381 // LATIN SMALL LETTER E WITH OGONEK
382 $string = str_replace("\352", 'ę', $string);
383 // LATIN SMALL LETTER E WITH DIAERESIS
384 $string = str_replace("\353", 'ë', $string);
385 // LATIN SMALL LETTER E WITH CARON
386 $string = str_replace("\354", 'ě', $string);
387 // LATIN SMALL LETTER I WITH ACUTE
388 $string = str_replace("\355", 'í', $string);
389 // LATIN SMALL LETTER I WITH CIRCUMFLEX
390 $string = str_replace("\356", 'î', $string);
391 // LATIN SMALL LETTER D WITH CARON
392 $string = str_replace("\357", 'ď', $string);
393 // LATIN SMALL LETTER D WITH STROKE
394 $string = str_replace("\360", 'đ', $string);
395 // LATIN SMALL LETTER N WITH ACUTE
396 $string = str_replace("\361", 'ń', $string);
397 // LATIN SMALL LETTER N WITH CARON
398 $string = str_replace("\362", 'ň', $string);
399 // LATIN SMALL LETTER O WITH ACUTE
400 $string = str_replace("\363", 'ó', $string);
401 // LATIN SMALL LETTER O WITH CIRCUMFLEX
402 $string = str_replace("\364", 'ô', $string);
403 // LATIN SMALL LETTER O WITH DOUBLE ACUTE
404 $string = str_replace("\365", 'ő', $string);
405 // LATIN SMALL LETTER O WITH DIAERESIS
406 $string = str_replace("\366", 'ö', $string);
408 $string = str_replace("\367", '÷', $string);
409 // LATIN SMALL LETTER R WITH CARON
410 $string = str_replace("\370", 'ř', $string);
411 // LATIN SMALL LETTER U WITH RING ABOVE
412 $string = str_replace("\371", 'ů', $string);
413 // LATIN SMALL LETTER U WITH ACUTE
414 $string = str_replace("\372", 'ú', $string);
415 // LATIN SMALL LETTER U WITH DOUBLE ACUTE
416 $string = str_replace("\373", 'ű', $string);
417 // LATIN SMALL LETTER U WITH DIAERESIS
418 $string = str_replace("\374", 'ü', $string);
419 // LATIN SMALL LETTER Y WITH ACUTE
420 $string = str_replace("\375", 'ý', $string);
421 // LATIN SMALL LETTER T WITH CEDILLA
422 $string = str_replace("\376", 'ţ', $string);
424 $string = str_replace("\377", '˙', $string);
430 ISO/IEC 8859-4:1998 Latin Alphabet No. 4
433 function charset_decode_iso_8859_4 ($string) {
434 global $default_charset;
436 if (strtolower($default_charset) == 'iso-8859-4')
439 /* Only do the slow convert if there are 8-bit characters */
440 if (! ereg("[\200-\377]", $string))
443 $string = str_replace ("\241", 'Ą', $string);
444 $string = str_replace ("\242", 'ĸ', $string);
445 $string = str_replace ("\243", 'Ŗ', $string);
446 $string = str_replace ("\245", 'Ĩ', $string);
447 $string = str_replace ("\246", 'Ļ', $string);
448 $string = str_replace ("\251", 'Š', $string);
449 $string = str_replace ("\252", 'Ē', $string);
450 $string = str_replace ("\253", 'Ģ', $string);
451 $string = str_replace ("\254", 'Ŧ', $string);
452 $string = str_replace ("\256", 'Ž', $string);
453 $string = str_replace ("\261", 'ą', $string);
454 $string = str_replace ("\262", '˛', $string);
455 $string = str_replace ("\263", 'ŗ', $string);
456 $string = str_replace ("\265", 'ĩ', $string);
457 $string = str_replace ("\266", 'ļ', $string);
458 $string = str_replace ("\267", 'ˇ', $string);
459 $string = str_replace ("\271", 'š', $string);
460 $string = str_replace ("\272", 'ē', $string);
461 $string = str_replace ("\273", 'ģ', $string);
462 $string = str_replace ("\274", 'ŧ', $string);
463 $string = str_replace ("\275", 'Ŋ', $string);
464 $string = str_replace ("\276", 'ž', $string);
465 $string = str_replace ("\277", 'ŋ', $string);
466 $string = str_replace ("\300", 'Ā', $string);
467 $string = str_replace ("\307", 'Į', $string);
468 $string = str_replace ("\310", 'Č', $string);
469 $string = str_replace ("\312", 'Ę', $string);
470 $string = str_replace ("\314", 'Ė', $string);
471 $string = str_replace ("\317", 'Ī', $string);
472 $string = str_replace ("\320", 'Đ', $string);
473 $string = str_replace ("\321", 'Ņ', $string);
474 $string = str_replace ("\322", 'Ō', $string);
475 $string = str_replace ("\323", 'Ķ', $string);
476 $string = str_replace ("\331", 'Ų', $string);
477 $string = str_replace ("\335", 'Ũ', $string);
478 $string = str_replace ("\336", 'Ū', $string);
479 $string = str_replace ("\340", 'ā', $string);
480 $string = str_replace ("\347", 'į', $string);
481 $string = str_replace ("\350", 'č', $string);
482 $string = str_replace ("\352", 'ę', $string);
483 $string = str_replace ("\354", 'ė', $string);
484 $string = str_replace ("\357", 'ī', $string);
485 $string = str_replace ("\360", 'đ', $string);
486 $string = str_replace ("\361", 'ņ', $string);
487 $string = str_replace ("\362", 'ō', $string);
488 $string = str_replace ("\363", 'ķ', $string);
489 $string = str_replace ("\371", 'ų', $string);
490 $string = str_replace ("\375", 'ũ', $string);
491 $string = str_replace ("\376", 'ū', $string);
492 $string = str_replace ("\377", '˙', $string);
494 // rest of charset is the same as ISO-8859-1
495 return (charset_decode_iso_8859_1($string));
498 /* ISO-8859-5 is Cyrillic */
499 function charset_decode_iso_8859_5 ($string) {
500 global $default_charset;
502 if (strtolower($default_charset) == 'iso-8859-5') {
506 /* Only do the slow convert if there are 8-bit characters */
507 if (! ereg("[\200-\377]", $string))
511 $string = str_replace("\240", ' ', $string);
512 // 161-172 -> 1025-1036 (+864)
513 $string = preg_replace("/([\241-\254])/e","'&#' . (ord('\\1')+864) . ';'",$string);
515 $string = str_replace("\255", '­', $string);
516 // 174-239 -> 1038-1103 (+864)
517 $string = preg_replace("/([\256-\357])/e","'&#' . (ord('\\1')+864) . ';'",$string);
519 $string = str_replace("\360", '№', $string);
520 // 241-252 -> 1105-1116 (+864)
521 $string = preg_replace("/([\361-\374])/e","'&#' . (ord('\\1')+864) . ';'",$string);
523 $string = str_replace("\375", '§', $string);
524 // CYRILLIC SMALL LETTER SHORT U (Byelorussian)
525 $string = str_replace("\376", 'ў', $string);
526 // CYRILLIC SMALL LETTER DZHE
527 $string = str_replace("\377", 'џ', $string);
532 /* iso-8859-7 is Greek. */
533 function charset_decode_iso_8859_7 ($string) {
534 global $default_charset;
536 if (strtolower($default_charset) == 'iso-8859-7') {
540 /* Only do the slow convert if there are 8-bit characters */
541 if (!ereg("[\200-\377]", $string)) {
545 /* Some diverse characters in the beginning */
546 $string = str_replace("\240", ' ', $string);
547 $string = str_replace("\241", '‘', $string);
548 $string = str_replace("\242", '’', $string);
549 $string = str_replace("\243", '£', $string);
550 $string = str_replace("\246", '¦', $string);
551 $string = str_replace("\247", '§', $string);
552 $string = str_replace("\250", '¨', $string);
553 $string = str_replace("\251", '©', $string);
554 $string = str_replace("\253", '«', $string);
555 $string = str_replace("\254", '¬', $string);
556 $string = str_replace("\255", '­', $string);
557 $string = str_replace("\257", '―', $string);
558 $string = str_replace("\260", '°', $string);
559 $string = str_replace("\261", '±', $string);
560 $string = str_replace("\262", '²', $string);
561 $string = str_replace("\263", '³', $string);
563 /* Horizontal bar (parentheki pavla) */
564 $string = str_replace ("\257", '―', $string);
567 * ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6)
568 * These are Unicode 900-902
570 $string = preg_replace("/([\264-\266])/e","'&#' . (ord('\\1')+720);",$string);
572 /* 11/07 (0xB7) Middle dot is the same in iso-8859-1 */
573 $string = str_replace("\267", '·', $string);
576 * ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA)
577 * These are Unicode 900-902
579 $string = preg_replace("/([\270-\272])/e","'&#' . (ord('\\1')+720);",$string);
582 * 11/11 (0xBB) Right angle quotation mark is the same as in
585 $string = str_replace("\273", '»', $string);
587 /* And now the rest of the charset */
588 $string = preg_replace("/([\274-\376])/e","'&#'.(ord('\\1')+720);",$string);
594 ISOIEC 8859-9:1999 Latin Alphabet No. 5
597 function charset_decode_iso_8859_9 ($string) {
598 global $default_charset;
600 if (strtolower($default_charset) == 'iso-8859-9')
603 /* Only do the slow convert if there are 8-bit characters */
604 if (! ereg("[\200-\377]", $string))
607 // latin capital letter g with breve 208->286
608 $string = str_replace("\320", 'Ğ', $string);
609 // latin capital letter i with dot above 221->304
610 $string = str_replace("\335", 'İ', $string);
611 // latin capital letter s with cedilla 222->350
612 $string = str_replace("\336", 'Ş', $string);
613 // latin small letter g with breve 240->287
614 $string = str_replace("\360", 'ğ', $string);
615 // latin small letter dotless i 253->305
616 $string = str_replace("\375", 'ı', $string);
617 // latin small letter s with cedilla 254->351
618 $string = str_replace("\376", 'ş', $string);
620 // rest of charset is the same as ISO-8859-1
621 return (charset_decode_iso_8859_1($string));
626 ISO/IEC 8859-13:1998 Latin Alphabet No. 7 (Baltic Rim)
628 function charset_decode_iso_8859_13 ($string) {
629 global $default_charset;
631 if (strtolower($default_charset) == 'iso-8859-13')
634 /* Only do the slow convert if there are 8-bit characters */
635 if (! ereg("[\200-\377]", $string))
638 $string = str_replace ("\241", '”', $string);
639 $string = str_replace ("\245", '„', $string);
640 $string = str_replace ("\250", 'Ø', $string);
641 $string = str_replace ("\252", 'Ŗ', $string);
642 $string = str_replace ("\257", 'Æ', $string);
643 $string = str_replace ("\264", '“', $string);
644 $string = str_replace ("\270", 'ø', $string);
645 $string = str_replace ("\272", 'ŗ', $string);
646 $string = str_replace ("\277", 'æ', $string);
647 $string = str_replace ("\300", 'Ą', $string);
648 $string = str_replace ("\301", 'Į', $string);
649 $string = str_replace ("\302", 'Ā', $string);
650 $string = str_replace ("\303", 'Ć', $string);
651 $string = str_replace ("\306", 'Ę', $string);
652 $string = str_replace ("\307", 'Ē', $string);
653 $string = str_replace ("\310", 'Č', $string);
654 $string = str_replace ("\312", 'Ź', $string);
655 $string = str_replace ("\313", 'Ė', $string);
656 $string = str_replace ("\314", 'Ģ', $string);
657 $string = str_replace ("\315", 'Ķ', $string);
658 $string = str_replace ("\316", 'Ī', $string);
659 $string = str_replace ("\317", 'Ļ', $string);
660 $string = str_replace ("\320", 'Š', $string);
661 $string = str_replace ("\321", 'Ń', $string);
662 $string = str_replace ("\322", 'Ņ', $string);
663 $string = str_replace ("\324", 'Ō', $string);
664 $string = str_replace ("\330", 'Ų', $string);
665 $string = str_replace ("\331", 'Ł', $string);
666 $string = str_replace ("\332", 'Ś', $string);
667 $string = str_replace ("\333", 'Ū', $string);
668 $string = str_replace ("\335", 'Ż', $string);
669 $string = str_replace ("\336", 'Ž', $string);
670 $string = str_replace ("\340", 'ą', $string);
671 $string = str_replace ("\341", 'į', $string);
672 $string = str_replace ("\342", 'ā', $string);
673 $string = str_replace ("\343", 'ć', $string);
674 $string = str_replace ("\346", 'ę', $string);
675 $string = str_replace ("\347", 'ē', $string);
676 $string = str_replace ("\350", 'č', $string);
677 $string = str_replace ("\352", 'ź', $string);
678 $string = str_replace ("\353", 'ė', $string);
679 $string = str_replace ("\354", 'ģ', $string);
680 $string = str_replace ("\355", 'ķ', $string);
681 $string = str_replace ("\356", 'ī', $string);
682 $string = str_replace ("\357", 'ļ', $string);
683 $string = str_replace ("\360", 'š', $string);
684 $string = str_replace ("\361", 'ń', $string);
685 $string = str_replace ("\362", 'ņ', $string);
686 $string = str_replace ("\364", 'ō', $string);
687 $string = str_replace ("\370", 'ų', $string);
688 $string = str_replace ("\371", 'ł', $string);
689 $string = str_replace ("\372", 'ś', $string);
690 $string = str_replace ("\373", 'ū', $string);
691 $string = str_replace ("\375", 'ż', $string);
692 $string = str_replace ("\376", 'ž', $string);
693 $string = str_replace ("\377", '’', $string);
695 // rest of charset is the same as ISO-8859-1
696 return (charset_decode_iso_8859_1($string));
700 * iso-8859-15 is Latin 9 and has very much the same use as Latin 1
701 * but has the Euro symbol and some characters needed for French.
703 function charset_decode_iso_8859_15 ($string) {
705 $string = str_replace ("\244", '€', $string);
706 // Latin capital letter S with caron
707 $string = str_replace ("\246", 'Š', $string);
708 // Latin small letter s with caron
709 $string = str_replace ("\250", 'š', $string);
710 // Latin capital letter Z with caron
711 $string = str_replace ("\264", 'Ž', $string);
712 // Latin small letter z with caron
713 $string = str_replace ("\270", 'ž', $string);
714 // Latin capital ligature OE
715 $string = str_replace ("\274", 'Œ', $string);
716 // Latin small ligature oe
717 $string = str_replace ("\275", 'œ', $string);
718 // Latin capital letter Y with diaeresis
719 $string = str_replace ("\276", 'Ÿ', $string);
721 return (charset_decode_iso_8859_1($string));
725 /* Remove all 8 bit characters from all other ISO-8859 character sets */
726 function charset_decode_iso_8859_default ($string) {
727 return (strtr($string, "\240\241\242\243\244\245\246\247".
728 "\250\251\252\253\254\255\256\257".
729 "\260\261\262\263\264\265\266\267".
730 "\270\271\272\273\274\275\276\277".
731 "\300\301\302\303\304\305\306\307".
732 "\310\311\312\313\314\315\316\317".
733 "\320\321\322\323\324\325\326\327".
734 "\330\331\332\333\334\335\336\337".
735 "\340\341\342\343\344\345\346\347".
736 "\350\351\352\353\354\355\356\357".
737 "\360\361\362\363\364\365\366\367".
738 "\370\371\372\373\374\375\376\377",
739 "????????????????????????????????????????".
740 "????????????????????????????????????????".
741 "????????????????????????????????????????".
747 * This is the same as ISO-646-NO and is used by some
748 * Microsoft programs when sending Norwegian characters
750 function charset_decode_ns_4551_1 ($string) {
752 * These characters are:
753 * Latin capital letter AE
754 * Latin capital letter O with stroke
755 * Latin capital letter A with ring above
756 * and the same as small letters
758 return strtr ($string, "[\\]{|}", "ÆØÅæøå");
762 * KOI8-R is used to encode Russian mail (Cyrrilic). Defined in RFC
765 function charset_decode_koi8r ($string) {
766 global $default_charset;
768 if ($default_charset == 'koi8-r') {
773 * Convert to Unicode HTML entities.
774 * This code is rather ineffective.
776 $string = str_replace("\200", '─', $string);
777 $string = str_replace("\201", '│', $string);
778 $string = str_replace("\202", '┌', $string);
779 $string = str_replace("\203", '┐', $string);
780 $string = str_replace("\204", '└', $string);
781 $string = str_replace("\205", '┘', $string);
782 $string = str_replace("\206", '├', $string);
783 $string = str_replace("\207", '┤', $string);
784 $string = str_replace("\210", '┬', $string);
785 $string = str_replace("\211", '┴', $string);
786 $string = str_replace("\212", '┼', $string);
787 $string = str_replace("\213", '▀', $string);
788 $string = str_replace("\214", '▄', $string);
789 $string = str_replace("\215", '█', $string);
790 $string = str_replace("\216", '▌', $string);
791 $string = str_replace("\217", '▐', $string);
792 $string = str_replace("\220", '░', $string);
793 $string = str_replace("\221", '▒', $string);
794 $string = str_replace("\222", '▓', $string);
795 $string = str_replace("\223", '⌠', $string);
796 $string = str_replace("\224", '■', $string);
797 $string = str_replace("\225", '∙', $string);
798 $string = str_replace("\226", '√', $string);
799 $string = str_replace("\227", '≈', $string);
800 $string = str_replace("\230", '≤', $string);
801 $string = str_replace("\231", '≥', $string);
802 $string = str_replace("\232", ' ', $string);
803 $string = str_replace("\233", '⌡', $string);
804 $string = str_replace("\234", '°', $string);
805 $string = str_replace("\235", '²', $string);
806 $string = str_replace("\236", '·', $string);
807 $string = str_replace("\237", '÷', $string);
808 $string = str_replace("\240", '═', $string);
809 $string = str_replace("\241", '║', $string);
810 $string = str_replace("\242", '╒', $string);
811 $string = str_replace("\243", 'ё', $string);
812 $string = str_replace("\244", '╓', $string);
813 $string = str_replace("\245", '╔', $string);
814 $string = str_replace("\246", '╕', $string);
815 $string = str_replace("\247", '╖', $string);
816 $string = str_replace("\250", '╗', $string);
817 $string = str_replace("\251", '╘', $string);
818 $string = str_replace("\252", '╙', $string);
819 $string = str_replace("\253", '╚', $string);
820 $string = str_replace("\254", '╛', $string);
821 $string = str_replace("\255", '╜', $string);
822 $string = str_replace("\256", '╝', $string);
823 $string = str_replace("\257", '╞', $string);
824 $string = str_replace("\260", '╟', $string);
825 $string = str_replace("\261", '╠', $string);
826 $string = str_replace("\262", '╡', $string);
827 $string = str_replace("\263", 'Ё', $string);
828 $string = str_replace("\264", '╢', $string);
829 $string = str_replace("\265", '╣', $string);
830 $string = str_replace("\266", '╤', $string);
831 $string = str_replace("\267", '╥', $string);
832 $string = str_replace("\270", '╦', $string);
833 $string = str_replace("\271", '╧', $string);
834 $string = str_replace("\272", '╨', $string);
835 $string = str_replace("\273", '╩', $string);
836 $string = str_replace("\274", '╪', $string);
837 $string = str_replace("\275", '╫', $string);
838 $string = str_replace("\276", '╬', $string);
839 $string = str_replace("\277", '©', $string);
840 $string = str_replace("\300", 'ю', $string);
841 $string = str_replace("\301", 'а', $string);
842 $string = str_replace("\302", 'б', $string);
843 $string = str_replace("\303", 'ц', $string);
844 $string = str_replace("\304", 'д', $string);
845 $string = str_replace("\305", 'е', $string);
846 $string = str_replace("\306", 'ф', $string);
847 $string = str_replace("\307", 'г', $string);
848 $string = str_replace("\310", 'х', $string);
849 $string = str_replace("\311", 'и', $string);
850 $string = str_replace("\312", 'й', $string);
851 $string = str_replace("\313", 'к', $string);
852 $string = str_replace("\314", 'л', $string);
853 $string = str_replace("\315", 'м', $string);
854 $string = str_replace("\316", 'н', $string);
855 $string = str_replace("\317", 'о', $string);
856 $string = str_replace("\320", 'п', $string);
857 $string = str_replace("\321", 'я', $string);
858 $string = str_replace("\322", 'р', $string);
859 $string = str_replace("\323", 'с', $string);
860 $string = str_replace("\324", 'т', $string);
861 $string = str_replace("\325", 'у', $string);
862 $string = str_replace("\326", 'ж', $string);
863 $string = str_replace("\327", 'в', $string);
864 $string = str_replace("\330", 'ь', $string);
865 $string = str_replace("\331", 'ы', $string);
866 $string = str_replace("\332", 'з', $string);
867 $string = str_replace("\333", 'ш', $string);
868 $string = str_replace("\334", 'э', $string);
869 $string = str_replace("\335", 'щ', $string);
870 $string = str_replace("\336", 'ч', $string);
871 $string = str_replace("\337", 'ъ', $string);
872 $string = str_replace("\340", 'Ю', $string);
873 $string = str_replace("\341", 'А', $string);
874 $string = str_replace("\342", 'Б', $string);
875 $string = str_replace("\343", 'Ц', $string);
876 $string = str_replace("\344", 'Д', $string);
877 $string = str_replace("\345", 'Е', $string);
878 $string = str_replace("\346", 'Ф', $string);
879 $string = str_replace("\347", 'Г', $string);
880 $string = str_replace("\350", 'Х', $string);
881 $string = str_replace("\351", 'И', $string);
882 $string = str_replace("\352", 'Й', $string);
883 $string = str_replace("\353", 'К', $string);
884 $string = str_replace("\354", 'Л', $string);
885 $string = str_replace("\355", 'М', $string);
886 $string = str_replace("\356", 'Н', $string);
887 $string = str_replace("\357", 'О', $string);
888 $string = str_replace("\360", 'П', $string);
889 $string = str_replace("\361", 'Я', $string);
890 $string = str_replace("\362", 'Р', $string);
891 $string = str_replace("\363", 'С', $string);
892 $string = str_replace("\364", 'Т', $string);
893 $string = str_replace("\365", 'У', $string);
894 $string = str_replace("\366", 'Ж', $string);
895 $string = str_replace("\367", 'В', $string);
896 $string = str_replace("\370", 'Ь', $string);
897 $string = str_replace("\371", 'Ы', $string);
898 $string = str_replace("\372", 'З', $string);
899 $string = str_replace("\373", 'Ш', $string);
900 $string = str_replace("\374", 'Э', $string);
901 $string = str_replace("\375", 'Щ', $string);
902 $string = str_replace("\376", 'Ч', $string);
903 $string = str_replace("\377", 'Ъ', $string);
909 * KOI8-U is used to encode Ukrainian mail (Cyrrilic). Defined in RFC
912 function charset_decode_koi8u ($string) {
913 global $default_charset;
915 if (strtolower($default_charset) == 'koi8-u') {
919 /* Only do the slow convert if there are 8-bit characters */
920 if (! ereg("[\200-\377]", $string))
923 // BOX DRAWINGS LIGHT HORIZONTAL
924 $string = str_replace("\200", '─', $string);
925 // BOX DRAWINGS LIGHT VERTICAL
926 $string = str_replace("\201", '│', $string);
927 // BOX DRAWINGS LIGHT DOWN AND RIGHT
928 $string = str_replace("\202", '┌', $string);
929 // BOX DRAWINGS LIGHT DOWN AND LEFT
930 $string = str_replace("\203", '┐', $string);
931 // BOX DRAWINGS LIGHT UP AND RIGHT
932 $string = str_replace("\204", '└', $string);
933 // BOX DRAWINGS LIGHT UP AND LEFT
934 $string = str_replace("\205", '┘', $string);
935 // BOX DRAWINGS LIGHT VERTICAL AND RIGHT
936 $string = str_replace("\206", '├', $string);
937 // BOX DRAWINGS LIGHT VERTICAL AND LEFT
938 $string = str_replace("\207", '┤', $string);
939 // BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
940 $string = str_replace("\210", '┬', $string);
941 // BOX DRAWINGS LIGHT UP AND HORIZONTAL
942 $string = str_replace("\211", '┴', $string);
943 // BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
944 $string = str_replace("\212", '┼', $string);
946 $string = str_replace("\213", '▀', $string);
948 $string = str_replace("\214", '▄', $string);
950 $string = str_replace("\215", '█', $string);
952 $string = str_replace("\216", '▌', $string);
954 $string = str_replace("\217", '▐', $string);
956 $string = str_replace("\220", '░', $string);
958 $string = str_replace("\221", '▒', $string);
960 $string = str_replace("\222", '▓', $string);
962 $string = str_replace("\223", '⌠', $string);
964 $string = str_replace("\224", '■', $string);
966 $string = str_replace("\225", '∙', $string);
968 $string = str_replace("\226", '√', $string);
970 $string = str_replace("\227", '≈', $string);
971 // LESS THAN OR EQUAL TO
972 $string = str_replace("\230", '≤', $string);
973 // GREATER THAN OR EQUAL TO
974 $string = str_replace("\231", '≥', $string);
976 $string = str_replace("\232", ' ', $string);
977 // BOTTOM HALF INTEGRAL
978 $string = str_replace("\233", '⌡', $string);
980 $string = str_replace("\234", '°', $string);
981 // SUPERSCRIPT DIGIT TWO
982 $string = str_replace("\235", '²', $string);
984 $string = str_replace("\236", '·', $string);
986 $string = str_replace("\237", '÷', $string);
987 // BOX DRAWINGS DOUBLE HORIZONTAL
988 $string = str_replace("\240", '═', $string);
989 // BOX DRAWINGS DOUBLE VERTICAL
990 $string = str_replace("\241", '║', $string);
991 // BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE
992 $string = str_replace("\242", '╒', $string);
993 // CYRILLIC SMALL LETTER IO
994 $string = str_replace("\243", 'ё', $string);
995 // CYRILLIC SMALL LETTER UKRAINIAN IE
996 $string = str_replace("\244", 'є', $string);
997 // BOX DRAWINGS DOUBLE DOWN AND RIGHT
998 $string = str_replace("\245", '╔', $string);
999 // CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
1000 $string = str_replace("\246", 'і', $string);
1001 // CYRILLIC SMALL LETTER YI (Ukrainian)
1002 $string = str_replace("\247", 'ї', $string);
1003 // BOX DRAWINGS DOUBLE DOWN AND LEFT
1004 $string = str_replace("\250", '╗', $string);
1005 // BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE
1006 $string = str_replace("\251", '╘', $string);
1007 // BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE
1008 $string = str_replace("\252", '╙', $string);
1009 // BOX DRAWINGS DOUBLE UP AND RIGHT
1010 $string = str_replace("\253", '╚', $string);
1011 // BOX DRAWINGS UP SINGLE AND LEFT DOUBLE
1012 $string = str_replace("\254", '╛', $string);
1013 // CYRILLIC SMALL LETTER GHE WITH UPTURN
1014 $string = str_replace("\255", 'ґ', $string);
1015 // BOX DRAWINGS DOUBLE UP AND LEFT
1016 $string = str_replace("\256", '╝', $string);
1017 // BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
1018 $string = str_replace("\257", '╞', $string);
1019 // BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
1020 $string = str_replace("\260", '╟', $string);
1021 // BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
1022 $string = str_replace("\261", '╠', $string);
1023 // BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
1024 $string = str_replace("\262", '╡', $string);
1025 // CYRILLIC CAPITAL LETTER IO
1026 $string = str_replace("\263", 'Ё', $string);
1027 // CYRILLIC CAPITAL LETTER UKRAINIAN IE
1028 $string = str_replace("\264", 'Є', $string);
1029 // DOUBLE VERTICAL AND LEFT
1030 $string = str_replace("\265", '╣', $string);
1031 // CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
1032 $string = str_replace("\266", 'І', $string);
1033 // CYRILLIC CAPITAL LETTER YI (Ukrainian)
1034 $string = str_replace("\267", 'Ї', $string);
1035 // BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
1036 $string = str_replace("\270", '╦', $string);
1037 // BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
1038 $string = str_replace("\271", '╧', $string);
1039 // BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
1040 $string = str_replace("\272", '╨', $string);
1041 // BOX DRAWINGS DOUBLE UP AND HORIZONTAL
1042 $string = str_replace("\273", '╩', $string);
1043 // BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
1044 $string = str_replace("\274", '╪', $string);
1045 // CYRILLIC CAPITAL LETTER GHE WITH UPTURN
1046 $string = str_replace("\275", 'Ґ', $string);
1047 // BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL
1048 $string = str_replace("\276", '╬', $string);
1050 $string = str_replace("\277", '©', $string);
1051 // CYRILLIC SMALL LETTER YU
1052 $string = str_replace("\300", 'ю', $string);
1053 // CYRILLIC SMALL LETTER A
1054 $string = str_replace("\301", 'а', $string);
1055 // CYRILLIC SMALL LETTER BE
1056 $string = str_replace("\302", 'б', $string);
1057 // CYRILLIC SMALL LETTER TSE
1058 $string = str_replace("\303", 'ц', $string);
1059 // CYRILLIC SMALL LETTER DE
1060 $string = str_replace("\304", 'д', $string);
1061 // CYRILLIC SMALL LETTER IE
1062 $string = str_replace("\305", 'е', $string);
1063 // CYRILLIC SMALL LETTER EF
1064 $string = str_replace("\306", 'ф', $string);
1065 // CYRILLIC SMALL LETTER GHE
1066 $string = str_replace("\307", 'г', $string);
1067 // CYRILLIC SMALL LETTER HA
1068 $string = str_replace("\310", 'х', $string);
1069 // CYRILLIC SMALL LETTER I
1070 $string = str_replace("\311", 'и', $string);
1071 // CYRILLIC SMALL LETTER SHORT I
1072 $string = str_replace("\312", 'й', $string);
1073 // CYRILLIC SMALL LETTER KA
1074 $string = str_replace("\313", 'к', $string);
1075 // CYRILLIC SMALL LETTER EL
1076 $string = str_replace("\314", 'л', $string);
1077 // CYRILLIC SMALL LETTER EM
1078 $string = str_replace("\315", 'м', $string);
1079 // CYRILLIC SMALL LETTER EN
1080 $string = str_replace("\316", 'н', $string);
1081 // CYRILLIC SMALL LETTER O
1082 $string = str_replace("\317", 'о', $string);
1083 // CYRILLIC SMALL LETTER PE
1084 $string = str_replace("\320", 'п', $string);
1085 // CYRILLIC SMALL LETTER YA
1086 $string = str_replace("\321", 'я', $string);
1087 // CYRILLIC SMALL LETTER ER
1088 $string = str_replace("\322", 'р', $string);
1089 // CYRILLIC SMALL LETTER ES
1090 $string = str_replace("\323", 'с', $string);
1091 // CYRILLIC SMALL LETTER TE
1092 $string = str_replace("\324", 'т', $string);
1093 // CYRILLIC SMALL LETTER U
1094 $string = str_replace("\325", 'у', $string);
1095 // CYRILLIC SMALL LETTER ZHE
1096 $string = str_replace("\326", 'ж', $string);
1097 // CYRILLIC SMALL LETTER VE
1098 $string = str_replace("\327", 'в', $string);
1099 // CYRILLIC SMALL LETTER SOFT SIGN
1100 $string = str_replace("\330", 'ь', $string);
1101 // CYRILLIC SMALL LETTER YERU
1102 $string = str_replace("\331", 'ы', $string);
1103 // CYRILLIC SMALL LETTER ZE
1104 $string = str_replace("\332", 'з', $string);
1105 // CYRILLIC SMALL LETTER SHA
1106 $string = str_replace("\333", 'ш', $string);
1107 // CYRILLIC SMALL LETTER E
1108 $string = str_replace("\334", 'э', $string);
1109 // CYRILLIC SMALL LETTER SHCHA
1110 $string = str_replace("\335", 'щ', $string);
1111 // CYRILLIC SMALL LETTER CHE
1112 $string = str_replace("\336", 'ч', $string);
1113 // CYRILLIC SMALL LETTER HARD SIGN
1114 $string = str_replace("\337", 'ъ', $string);
1115 // CYRILLIC CAPITAL LETTER YU
1116 $string = str_replace("\340", 'Ю', $string);
1117 // CYRILLIC CAPITAL LETTER A
1118 $string = str_replace("\341", 'А', $string);
1119 // CYRILLIC CAPITAL LETTER BE
1120 $string = str_replace("\342", 'Б', $string);
1121 // CYRILLIC CAPITAL LETTER TSE
1122 $string = str_replace("\343", 'Ц', $string);
1123 // CYRILLIC CAPITAL LETTER DE
1124 $string = str_replace("\344", 'Д', $string);
1125 // CYRILLIC CAPITAL LETTER IE
1126 $string = str_replace("\345", 'Е', $string);
1127 // CYRILLIC CAPITAL LETTER EF
1128 $string = str_replace("\346", 'Ф', $string);
1129 // CYRILLIC CAPITAL LETTER GHE
1130 $string = str_replace("\347", 'Г', $string);
1131 // CYRILLIC CAPITAL LETTER HA
1132 $string = str_replace("\350", 'Х', $string);
1133 // CYRILLIC CAPITAL LETTER I
1134 $string = str_replace("\351", 'И', $string);
1135 // CYRILLIC CAPITAL LETTER SHORT I
1136 $string = str_replace("\352", 'Й', $string);
1137 // CYRILLIC CAPITAL LETTER KA
1138 $string = str_replace("\353", 'К', $string);
1139 // CYRILLIC CAPITAL LETTER EL
1140 $string = str_replace("\354", 'Л', $string);
1141 // CYRILLIC CAPITAL LETTER EM
1142 $string = str_replace("\355", 'М', $string);
1143 // CYRILLIC CAPITAL LETTER EN
1144 $string = str_replace("\356", 'Н', $string);
1145 // CYRILLIC CAPITAL LETTER O
1146 $string = str_replace("\357", 'О', $string);
1147 // CYRILLIC CAPITAL LETTER PE
1148 $string = str_replace("\360", 'П', $string);
1149 // CYRILLIC CAPITAL LETTER YA
1150 $string = str_replace("\361", 'Я', $string);
1151 // CYRILLIC CAPITAL LETTER ER
1152 $string = str_replace("\362", 'Р', $string);
1153 // CYRILLIC CAPITAL LETTER ES
1154 $string = str_replace("\363", 'С', $string);
1155 // CYRILLIC CAPITAL LETTER TE
1156 $string = str_replace("\364", 'Т', $string);
1157 // CYRILLIC CAPITAL LETTER U
1158 $string = str_replace("\365", 'У', $string);
1159 // CYRILLIC CAPITAL LETTER ZHE
1160 $string = str_replace("\366", 'Ж', $string);
1161 // CYRILLIC CAPITAL LETTER VE
1162 $string = str_replace("\367", 'В', $string);
1163 // CYRILLIC CAPITAL LETTER SOFT SIGN
1164 $string = str_replace("\370", 'Ь', $string);
1165 // CYRILLIC CAPITAL LETTER YERU
1166 $string = str_replace("\371", 'Ы', $string);
1167 // CYRILLIC CAPITAL LETTER ZE
1168 $string = str_replace("\372", 'З', $string);
1169 // CYRILLIC CAPITAL LETTER SHA
1170 $string = str_replace("\373", 'Ш', $string);
1171 // CYRILLIC CAPITAL LETTER E
1172 $string = str_replace("\374", 'Э', $string);
1173 // CYRILLIC CAPITAL LETTER SHCHA
1174 $string = str_replace("\375", 'Щ', $string);
1175 // CYRILLIC CAPITAL LETTER CHE
1176 $string = str_replace("\376", 'Ч', $string);
1177 // CYRILLIC CAPITAL LETTER HARD SIGN
1178 $string = str_replace("\377", 'Ъ', $string);
1184 * windows-1251 is used to encode Bulgarian mail (Cyrrilic).
1186 function charset_decode_windows_1251 ($string) {
1187 global $default_charset;
1189 if (strtolower($default_charset) == 'windows-1251') {
1193 /* Only do the slow convert if there are 8-bit characters */
1194 if (! ereg("[\200-\377]", $string))
1197 // CYRILLIC CAPITAL LETTER DJE (Serbocroatian)
1198 $string = str_replace("\200", 'Ђ', $string);
1199 // CYRILLIC CAPITAL LETTER GJE
1200 $string = str_replace("\201", 'Ѓ', $string);
1201 // SINGLE LOW-9 QUOTATION MARK
1202 $string = str_replace("\202", '‚', $string);
1203 // CYRILLIC SMALL LETTER GJE
1204 $string = str_replace("\203", 'ѓ', $string);
1205 // DOUBLE LOW-9 QUOTATION MARK
1206 $string = str_replace("\204", '„', $string);
1207 // HORIZONTAL ELLIPSIS
1208 $string = str_replace("\205", '…', $string);
1210 $string = str_replace("\206", '†', $string);
1212 $string = str_replace("\207", '‡', $string);
1214 $string = str_replace("\210", '€', $string);
1216 $string = str_replace("\211", '‰', $string);
1217 // CYRILLIC CAPITAL LETTER LJE
1218 $string = str_replace("\212", 'Љ', $string);
1219 // SINGLE LEFT-POINTING ANGLE QUOTATION MARK
1220 $string = str_replace("\213", '‹', $string);
1221 // CYRILLIC CAPITAL LETTER NJE
1222 $string = str_replace("\214", 'Њ', $string);
1223 // CYRILLIC CAPITAL LETTER KJE
1224 $string = str_replace("\215", 'Ќ', $string);
1225 // CYRILLIC CAPITAL LETTER TSHE (Serbocroatian)
1226 $string = str_replace("\216", 'Ћ', $string);
1227 // CYRILLIC CAPITAL LETTER DZHE
1228 $string = str_replace("\217", 'Џ', $string);
1229 // CYRILLIC SMALL LETTER DJE (Serbocroatian)
1230 $string = str_replace("\220", 'ђ', $string);
1231 // LEFT SINGLE QUOTATION MARK
1232 $string = str_replace("\221", '‘', $string);
1233 // RIGHT SINGLE QUOTATION MARK
1234 $string = str_replace("\222", '’', $string);
1235 // LEFT DOUBLE QUOTATION MARK
1236 $string = str_replace("\223", '“', $string);
1237 // RIGHT DOUBLE QUOTATION MARK
1238 $string = str_replace("\224", '”', $string);
1240 $string = str_replace("\225", '•', $string);
1242 $string = str_replace("\226", '–', $string);
1244 $string = str_replace("\227", '—', $string);
1246 $string = str_replace("\231", '™', $string);
1247 // CYRILLIC SMALL LETTER LJE
1248 $string = str_replace("\232", 'љ', $string);
1249 // SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
1250 $string = str_replace("\233", '›', $string);
1251 // CYRILLIC SMALL LETTER NJE
1252 $string = str_replace("\234", 'њ', $string);
1253 // CYRILLIC SMALL LETTER KJE
1254 $string = str_replace("\235", 'ќ', $string);
1255 // CYRILLIC SMALL LETTER TSHE (Serbocroatian)
1256 $string = str_replace("\236", 'ћ', $string);
1257 // CYRILLIC SMALL LETTER DZHE
1258 $string = str_replace("\237", 'џ', $string);
1260 $string = str_replace("\240", ' ', $string);
1261 // CYRILLIC CAPITAL LETTER SHORT U (Byelorussian)
1262 $string = str_replace("\241", 'Ў', $string);
1263 // CYRILLIC SMALL LETTER SHORT U (Byelorussian)
1264 $string = str_replace("\242", 'ў', $string);
1265 // CYRILLIC CAPITAL LETTER JE
1266 $string = str_replace("\243", 'Ј', $string);
1268 $string = str_replace("\244", '¤', $string);
1269 // CYRILLIC CAPITAL LETTER GHE WITH UPTURN
1270 $string = str_replace("\245", 'Ґ', $string);
1272 $string = str_replace("\246", '¦', $string);
1274 $string = str_replace("\247", '§', $string);
1275 // CYRILLIC CAPITAL LETTER IO
1276 $string = str_replace("\250", 'Ё', $string);
1278 $string = str_replace("\251", '©', $string);
1279 // CYRILLIC CAPITAL LETTER UKRAINIAN IE
1280 $string = str_replace("\252", 'Є', $string);
1281 // LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
1282 $string = str_replace("\253", '«', $string);
1284 $string = str_replace("\254", '¬', $string);
1286 $string = str_replace("\255", '­', $string);
1288 $string = str_replace("\256", '®', $string);
1289 // CYRILLIC CAPITAL LETTER YI (Ukrainian)
1290 $string = str_replace("\257", 'Ї', $string);
1292 $string = str_replace("\260", '°', $string);
1294 $string = str_replace("\261", '±', $string);
1295 // CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
1296 $string = str_replace("\262", 'І', $string);
1297 // CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
1298 $string = str_replace("\263", 'і', $string);
1299 // CYRILLIC SMALL LETTER GHE WITH UPTURN
1300 $string = str_replace("\264", 'ґ', $string);
1302 $string = str_replace("\265", 'µ', $string);
1304 $string = str_replace("\266", '¶', $string);
1306 $string = str_replace("\267", '·', $string);
1307 // CYRILLIC SMALL LETTER IO
1308 $string = str_replace("\270", 'ё', $string);
1310 $string = str_replace("\271", '№', $string);
1311 // CYRILLIC SMALL LETTER UKRAINIAN IE
1312 $string = str_replace("\272", 'є', $string);
1313 // RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
1314 $string = str_replace("\273", '»', $string);
1315 // CYRILLIC SMALL LETTER JE
1316 $string = str_replace("\274", 'ј', $string);
1317 // CYRILLIC CAPITAL LETTER DZE
1318 $string = str_replace("\275", 'Ѕ', $string);
1319 // CYRILLIC SMALL LETTER DZE
1320 $string = str_replace("\276", 'ѕ', $string);
1321 // CYRILLIC SMALL LETTER YI (Ukrainian)
1322 $string = str_replace("\277", 'ї', $string);
1324 // 192-255 > 1040-1103 (+848)
1325 $string = preg_replace("/([\300-\377])/e","'&#' . (ord('\\1')+848) . ';'",$string);
1331 windows-1253 (Greek)
1333 function charset_decode_windows_1253 ($string) {
1334 global $default_charset;
1336 if (strtolower($default_charset) == 'windows-1253')
1339 /* Only do the slow convert if there are 8-bit characters */
1340 if (! ereg("[\200-\377]", $string))
1343 $string = str_replace("\200", '€', $string);
1344 $string = str_replace("\202", '‚', $string);
1345 $string = str_replace("\203", 'ƒ', $string);
1346 $string = str_replace("\204", '„', $string);
1347 $string = str_replace("\205", '…', $string);
1348 $string = str_replace("\206", '†', $string);
1349 $string = str_replace("\207", '‡', $string);
1350 $string = str_replace("\211", '‰', $string);
1351 $string = str_replace("\213", '‹', $string);
1352 $string = str_replace("\221", '‘', $string);
1353 $string = str_replace("\222", '’', $string);
1354 $string = str_replace("\223", '“', $string);
1355 $string = str_replace("\224", '”', $string);
1356 $string = str_replace("\225", '•', $string);
1357 $string = str_replace("\226", '–', $string);
1358 $string = str_replace("\227", '—', $string);
1359 $string = str_replace("\231", '™', $string);
1360 $string = str_replace("\233", '›', $string);
1361 $string = str_replace("\241", '΅', $string);
1362 $string = str_replace("\242", 'Ά', $string);
1363 $string = str_replace ("\257", '―', $string);
1364 $string = str_replace("\264", '΄', $string);
1365 $string = str_replace("\270", 'Έ', $string);
1366 $string = str_replace ("\271", 'Ή', $string);
1367 $string = str_replace ("\272", 'Ί', $string);
1368 $string = str_replace ("\274", 'Ό', $string);
1369 // cycle for 190-254 symbols
1370 $string = preg_replace("/([\274-\376])/e","'&#' . (ord('\\1')+720);",$string);
1372 // Rest of charset is like iso-8859-1
1373 return (charset_decode_iso_8859_1($string));
1377 windows-1254 (Turks)
1379 function charset_decode_windows_1254 ($string) {
1380 global $default_charset;
1382 if (strtolower($default_charset) == 'windows-1254')
1385 /* Only do the slow convert if there are 8-bit characters */
1386 if (! ereg("[\200-\377]", $string))
1389 // Euro sign 128 -> 8364
1390 $string = str_replace("\200", '€', $string);
1391 // Single low-9 quotation mark 130 -> 8218
1392 $string = str_replace("\202", '‚', $string);
1393 // latin small letter f with hook 131 -> 402
1394 $string = str_replace("\203", 'ƒ', $string);
1395 // Double low-9 quotation mark 132 -> 8222
1396 $string = str_replace("\204", '„', $string);
1397 // horizontal ellipsis 133 -> 8230
1398 $string = str_replace("\205", '…', $string);
1399 // dagger 134 -> 8224
1400 $string = str_replace("\206", '†', $string);
1401 // double dagger 135 -> 8225
1402 $string = str_replace("\207", '‡', $string);
1403 // modifier letter circumflex accent 136->710
1404 $string = str_replace("\210", 'ˆ', $string);
1405 // per mille sign 137 -> 8240
1406 $string = str_replace("\211", '‰', $string);
1407 // latin capital letter s with caron 138 -> 352
1408 $string = str_replace("\212", 'Š', $string);
1409 // single left-pointing angle quotation mark 139 -> 8249
1410 $string = str_replace("\213", '‹', $string);
1411 // latin capital ligature oe 140 -> 338
1412 $string = str_replace("\214", 'Œ', $string);
1413 // left single quotation mark 145 -> 8216
1414 $string = str_replace("\221", '‘', $string);
1415 // right single quotation mark 146 -> 8217
1416 $string = str_replace("\222", '’', $string);
1417 // left double quotation mark 147 -> 8220
1418 $string = str_replace("\223", '“', $string);
1419 // right double quotation mark 148 -> 8221
1420 $string = str_replace("\224", '”', $string);
1421 // bullet 149 -> 8226
1422 $string = str_replace("\225", '•', $string);
1423 // en dash 150 -> 8211
1424 $string = str_replace("\226", '–', $string);
1425 // em dash 151 -> 8212
1426 $string = str_replace("\227", '—', $string);
1427 // small tilde 152 -> 732
1428 $string = str_replace("\230", '˜', $string);
1429 // trade mark sign 153 -> 8482
1430 $string = str_replace("\231", '™', $string);
1431 // latin small letter s with caron 154 -> 353
1432 $string = str_replace("\232", 'š', $string);
1433 // single right-pointing angle quotation mark 155 -> 8250
1434 $string = str_replace("\233", '›', $string);
1435 // latin small ligature oe 156 -> 339
1436 $string = str_replace("\234", 'œ', $string);
1437 // latin capital letter y with diaresis 159->376
1438 $string = str_replace("\237", 'Ÿ', $string);
1439 // latin capital letter g with breve 208->286
1440 $string = str_replace("\320", 'Ğ', $string);
1441 // latin capital letter i with dot above 221->304
1442 $string = str_replace("\335", 'İ', $string);
1443 // latin capital letter s with cedilla 222->350
1444 $string = str_replace("\336", 'Ş', $string);
1445 // latin small letter g with breve 240->287
1446 $string = str_replace("\360", 'ğ', $string);
1447 // latin small letter dotless i 253->305
1448 $string = str_replace("\375", 'ı', $string);
1449 // latin small letter s with cedilla 254->351
1450 $string = str_replace("\376", 'ş', $string);
1452 // Rest of charset is like iso-8859-1
1453 return (charset_decode_iso_8859_1($string));
1457 windows-1257 (BaltRim)
1459 function charset_decode_windows_1257 ($string) {
1460 global $default_charset;
1462 if (strtolower($default_charset) == 'windows-1257')
1465 /* Only do the slow convert if there are 8-bit characters */
1466 if (! ereg("[\200-\377]", $string))
1469 $string = str_replace("\200", '€', $string);
1470 $string = str_replace("\202", '‚', $string);
1471 $string = str_replace("\204", '„', $string);
1472 $string = str_replace("\205", '…', $string);
1473 $string = str_replace("\206", '†', $string);
1474 $string = str_replace("\207", '‡', $string);
1475 $string = str_replace("\211", '‰', $string);
1476 $string = str_replace("\213", '‹', $string);
1477 $string = str_replace("\215", '¨', $string);
1478 $string = str_replace("\216", 'ˇ', $string);
1479 $string = str_replace("\217", '¸', $string);
1480 $string = str_replace("\221", '‘', $string);
1481 $string = str_replace("\222", '’', $string);
1482 $string = str_replace("\223", '“', $string);
1483 $string = str_replace("\224", '”', $string);
1484 $string = str_replace("\225", '•', $string);
1485 $string = str_replace("\226", '–', $string);
1486 $string = str_replace("\227", '—', $string);
1487 $string = str_replace("\231", '™', $string);
1488 $string = str_replace("\233", '›', $string);
1489 $string = str_replace("\235", '¯', $string);
1490 $string = str_replace("\236", '˛', $string);
1491 $string = str_replace ("\250", 'Ø', $string);
1492 $string = str_replace ("\252", 'Ŗ', $string);
1493 $string = str_replace ("\257", 'Æ', $string);
1494 $string = str_replace ("\270", 'ø', $string);
1495 $string = str_replace ("\272", 'ŗ', $string);
1496 $string = str_replace ("\277", 'æ', $string);
1497 $string = str_replace ("\300", 'Ą', $string);
1498 $string = str_replace ("\301", 'Į', $string);
1499 $string = str_replace ("\302", 'Ā', $string);
1500 $string = str_replace ("\303", 'Ć', $string);
1501 $string = str_replace ("\306", 'Ę', $string);
1502 $string = str_replace ("\307", 'Ē', $string);
1503 $string = str_replace ("\310", 'Č', $string);
1504 $string = str_replace ("\312", 'Ź', $string);
1505 $string = str_replace ("\313", 'Ė', $string);
1506 $string = str_replace ("\314", 'Ģ', $string);
1507 $string = str_replace ("\315", 'Ķ', $string);
1508 $string = str_replace ("\316", 'Ī', $string);
1509 $string = str_replace ("\317", 'Ļ', $string);
1510 $string = str_replace ("\320", 'Š', $string);
1511 $string = str_replace ("\321", 'Ń', $string);
1512 $string = str_replace ("\322", 'Ņ', $string);
1513 $string = str_replace ("\324", 'Ō', $string);
1514 $string = str_replace ("\330", 'Ų', $string);
1515 $string = str_replace ("\331", 'Ł', $string);
1516 $string = str_replace ("\332", 'Ŕ', $string);
1517 $string = str_replace ("\333", 'Ū', $string);
1518 $string = str_replace ("\335", 'Ż', $string);
1519 $string = str_replace ("\336", 'Ž', $string);
1520 $string = str_replace ("\340", 'ą', $string);
1521 $string = str_replace ("\341", 'į', $string);
1522 $string = str_replace ("\342", 'ā', $string);
1523 $string = str_replace ("\343", 'ć', $string);
1524 $string = str_replace ("\346", 'ę', $string);
1525 $string = str_replace ("\347", 'ē', $string);
1526 $string = str_replace ("\350", 'č', $string);
1527 $string = str_replace ("\352", 'ź', $string);
1528 $string = str_replace ("\353", 'ė', $string);
1529 $string = str_replace ("\354", 'ģ', $string);
1530 $string = str_replace ("\355", 'ķ', $string);
1531 $string = str_replace ("\356", 'ī', $string);
1532 $string = str_replace ("\357", 'ļ', $string);
1533 $string = str_replace ("\360", 'š', $string);
1534 $string = str_replace ("\361", 'ń', $string);
1535 $string = str_replace ("\362", 'ņ', $string);
1536 $string = str_replace ("\364", 'ō', $string);
1537 $string = str_replace ("\370", 'ų', $string);
1538 $string = str_replace ("\371", 'ł', $string);
1539 $string = str_replace ("\372", 'ś', $string);
1540 $string = str_replace ("\373", 'ū', $string);
1541 $string = str_replace ("\375", 'ż', $string);
1542 $string = str_replace ("\376", 'ž', $string);
1543 $string = str_replace ("\377", '˙', $string);
1545 // Rest of charset is like iso-8859-1
1546 return (charset_decode_iso_8859_1($string));
1551 * Set up the language to be output
1552 * if $do_search is true, then scan the browser information
1553 * for a possible language that we know
1555 function set_up_language($sm_language, $do_search = false) {
1557 static $SetupAlready = 0;
1558 global $use_gettext, $languages,
1559 $squirrelmail_language, $squirrelmail_default_language,
1562 if ($SetupAlready) {
1566 $SetupAlready = TRUE;
1567 sqgetGlobalVar('HTTP_ACCEPT_LANGUAGE', $accept_lang, SQ_SERVER
);
1569 if ($do_search && ! $sm_language && isset($accept_lang)) {
1570 $sm_language = substr($accept_lang, 0, 2);
1573 if (!$sm_language && isset($squirrelmail_default_language)) {
1574 $squirrelmail_language = $squirrelmail_default_language;
1575 $sm_language = $squirrelmail_default_language;
1577 $sm_notAlias = $sm_language;
1578 while (isset($languages[$sm_notAlias]['ALIAS'])) {
1579 $sm_notAlias = $languages[$sm_notAlias]['ALIAS'];
1582 if ( isset($sm_language) &&
1584 $sm_language != '' &&
1585 isset($languages[$sm_notAlias]['CHARSET']) ) {
1586 bindtextdomain( 'squirrelmail', SM_PATH
. 'locale/' );
1587 textdomain( 'squirrelmail' );
1588 if (function_exists('bind_textdomain_codeset')) {
1589 bind_textdomain_codeset ("squirrelmail", $languages[$sm_notAlias]['CHARSET'] );
1591 if ( !ini_get('safe_mode') &&
1592 getenv( 'LC_ALL' ) != $sm_notAlias ) {
1593 putenv( "LC_ALL=$sm_notAlias" );
1594 putenv( "LANG=$sm_notAlias" );
1595 putenv( "LANGUAGE=$sm_notAlias" );
1597 setlocale(LC_ALL
, $sm_notAlias);
1598 $squirrelmail_language = $sm_notAlias;
1599 if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) {
1600 header ('Content-Type: text/html; charset=EUC-JP');
1601 if (!function_exists('mb_internal_encoding')) {
1602 echo _("You need to have php4 installed with the multibyte string function enabled (using configure option --enable-mbstring).");
1604 if (function_exists('mb_language')) {
1605 mb_language('Japanese');
1607 mb_internal_encoding('EUC-JP');
1608 mb_http_output('pass');
1610 header( 'Content-Type: text/html; charset=' . $languages[$sm_notAlias]['CHARSET'] );
1615 function set_my_charset(){
1618 * There can be a $default_charset setting in the
1619 * config.php file, but the user may have a different language
1620 * selected for a user interface. This function checks the
1621 * language selected by the user and tags the outgoing messages
1622 * with the appropriate charset corresponding to the language
1623 * selection. This is "more right" (tm), than just stamping the
1624 * message blindly with the system-wide $default_charset.
1626 global $data_dir, $username, $default_charset, $languages, $squirrelmail_default_language;
1628 $my_language = getPref($data_dir, $username, 'language');
1629 if (!$my_language) {
1630 $my_language = $squirrelmail_default_language ;
1632 while (isset($languages[$my_language]['ALIAS'])) {
1633 $my_language = $languages[$my_language]['ALIAS'];
1635 $my_charset = $languages[$my_language]['CHARSET'];
1637 $default_charset = $my_charset;
1641 /* ------------------------------ main --------------------------- */
1643 global $squirrelmail_language, $languages, $use_gettext;
1645 if (! isset($squirrelmail_language)) {
1646 $squirrelmail_language = '';
1649 /* This array specifies the available languages. */
1651 // The glibc locale is ca_ES.
1653 $languages['ca_ES']['NAME'] = 'Catalan';
1654 $languages['ca_ES']['CHARSET'] = 'iso-8859-1';
1655 $languages['ca']['ALIAS'] = 'ca_ES';
1657 $languages['cs_CZ']['NAME'] = 'Czech';
1658 $languages['cs_CZ']['CHARSET'] = 'iso-8859-2';
1659 $languages['cs']['ALIAS'] = 'cs_CZ';
1661 // Danish locale is da_DK.
1663 $languages['da_DK']['NAME'] = 'Danish';
1664 $languages['da_DK']['CHARSET'] = 'iso-8859-1';
1665 $languages['da']['ALIAS'] = 'da_DK';
1667 $languages['de_DE']['NAME'] = 'Deutsch';
1668 $languages['de_DE']['CHARSET'] = 'iso-8859-1';
1669 $languages['de']['ALIAS'] = 'de_DE';
1671 // There is no en_EN! There is en_US, en_BR, en_AU, and so forth,
1672 // but who cares about !US, right? Right? :)
1674 $languages['el_GR']['NAME'] = 'Greek';
1675 $languages['el_GR']['CHARSET'] = 'iso-8859-7';
1676 $languages['el']['ALIAS'] = 'el_GR';
1678 $languages['en_US']['NAME'] = 'English';
1679 $languages['en_US']['CHARSET'] = 'iso-8859-1';
1680 $languages['en']['ALIAS'] = 'en_US';
1682 $languages['es_ES']['NAME'] = 'Spanish';
1683 $languages['es_ES']['CHARSET'] = 'iso-8859-1';
1684 $languages['es']['ALIAS'] = 'es_ES';
1686 $languages['et_EE']['NAME'] = 'Estonian';
1687 $languages['et_EE']['CHARSET'] = 'iso-8859-15';
1688 $languages['et']['ALIAS'] = 'et_EE';
1690 $languages['fo_FO']['NAME'] = 'Faroese';
1691 $languages['fo_FO']['CHARSET'] = 'iso-8859-1';
1692 $languages['fo']['ALIAS'] = 'fo_FO';
1694 $languages['fi_FI']['NAME'] = 'Finnish';
1695 $languages['fi_FI']['CHARSET'] = 'iso-8859-1';
1696 $languages['fi']['ALIAS'] = 'fi_FI';
1698 $languages['fr_FR']['NAME'] = 'French';
1699 $languages['fr_FR']['CHARSET'] = 'iso-8859-1';
1700 $languages['fr']['ALIAS'] = 'fr_FR';
1702 $languages['hr_HR']['NAME'] = 'Croatian';
1703 $languages['hr_HR']['CHARSET'] = 'iso-8859-2';
1704 $languages['hr']['ALIAS'] = 'hr_HR';
1706 $languages['hu_HU']['NAME'] = 'Hungarian';
1707 $languages['hu_HU']['CHARSET'] = 'iso-8859-2';
1708 $languages['hu']['ALIAS'] = 'hu_HU';
1710 $languages['id_ID']['NAME'] = 'Bahasa Indonesia';
1711 $languages['id_ID']['CHARSET'] = 'iso-8859-1';
1712 $languages['id']['ALIAS'] = 'id_ID';
1714 $languages['is_IS']['NAME'] = 'Icelandic';
1715 $languages['is_IS']['CHARSET'] = 'iso-8859-1';
1716 $languages['is']['ALIAS'] = 'is_IS';
1718 $languages['it_IT']['NAME'] = 'Italian';
1719 $languages['it_IT']['CHARSET'] = 'iso-8859-1';
1720 $languages['it']['ALIAS'] = 'it_IT';
1722 $languages['ja_JP']['NAME'] = 'Japanese';
1723 $languages['ja_JP']['CHARSET'] = 'iso-2022-jp';
1724 $languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra';
1725 $languages['ja']['ALIAS'] = 'ja_JP';
1727 $languages['ko_KR']['NAME'] = 'Korean';
1728 $languages['ko_KR']['CHARSET'] = 'euc-KR';
1729 $languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra';
1730 $languages['ko']['ALIAS'] = 'ko_KR';
1732 $languages['nl_NL']['NAME'] = 'Dutch';
1733 $languages['nl_NL']['CHARSET'] = 'iso-8859-1';
1734 $languages['nl']['ALIAS'] = 'nl_NL';
1736 $languages['no_NO']['NAME'] = 'Norwegian (Bokmål)';
1737 $languages['no_NO']['CHARSET'] = 'iso-8859-1';
1738 $languages['no']['ALIAS'] = 'no_NO';
1739 $languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)';
1740 $languages['nn_NO']['CHARSET'] = 'iso-8859-1';
1742 $languages['pl_PL']['NAME'] = 'Polish';
1743 $languages['pl_PL']['CHARSET'] = 'iso-8859-2';
1744 $languages['pl']['ALIAS'] = 'pl_PL';
1746 $languages['pt_PT']['NAME'] = 'Portuguese (Portugal)';
1747 $languages['pt_PT']['CHARSET'] = 'iso-8859-1';
1748 $languages['pt_BR']['NAME'] = 'Portuguese (Brazil)';
1749 $languages['pt_BR']['CHARSET'] = 'iso-8859-1';
1750 $languages['pt']['ALIAS'] = 'pt_PT';
1752 $languages['ru_RU']['NAME'] = 'Russian';
1753 $languages['ru_RU']['CHARSET'] = 'koi8-r';
1754 $languages['ru']['ALIAS'] = 'ru_RU';
1756 $languages['sr_YU']['NAME'] = 'Serbian';
1757 $languages['sr_YU']['CHARSET'] = 'iso-8859-2';
1758 $languages['sr']['ALIAS'] = 'sr_YU';
1760 $languages['sv_SE']['NAME'] = 'Swedish';
1761 $languages['sv_SE']['CHARSET'] = 'iso-8859-1';
1762 $languages['sv']['ALIAS'] = 'sv_SE';
1764 $languages['tr_TR']['NAME'] = 'Turkish';
1765 $languages['tr_TR']['CHARSET'] = 'iso-8859-9';
1766 $languages['tr']['ALIAS'] = 'tr_TR';
1768 $languages['zh_TW']['NAME'] = 'Chinese Trad';
1769 $languages['zh_TW']['CHARSET'] = 'big5';
1770 $languages['tw']['ALIAS'] = 'zh_TW';
1772 $languages['zh_CN']['NAME'] = 'Chinese Simp';
1773 $languages['zh_CN']['CHARSET'] = 'gb2312';
1774 $languages['cn']['ALIAS'] = 'zh_CN';
1776 $languages['sk_SK']['NAME'] = 'Slovak';
1777 $languages['sk_SK']['CHARSET'] = 'iso-8859-2';
1778 $languages['sk']['ALIAS'] = 'sk_SK';
1780 $languages['ro_RO']['NAME'] = 'Romanian';
1781 $languages['ro_RO']['CHARSET'] = 'iso-8859-2';
1782 $languages['ro']['ALIAS'] = 'ro_RO';
1784 $languages['th_TH']['NAME'] = 'Thai';
1785 $languages['th_TH']['CHARSET'] = 'tis-620';
1786 $languages['th']['ALIAS'] = 'th_TH';
1788 $languages['lt_LT']['NAME'] = 'Lithuanian';
1789 $languages['lt_LT']['CHARSET'] = 'windows-1257';
1790 $languages['lt']['ALIAS'] = 'lt_LT';
1792 $languages['sl_SI']['NAME'] = 'Slovenian';
1793 $languages['sl_SI']['CHARSET'] = 'iso-8859-2';
1794 $languages['sl']['ALIAS'] = 'sl_SI';
1796 $languages['bg_BG']['NAME'] = 'Bulgarian';
1797 $languages['bg_BG']['CHARSET'] = 'windows-1251';
1798 $languages['bg']['ALIAS'] = 'bg_BG';
1800 $languages['uk_UA']['NAME'] = 'Ukrainian';
1801 $languages['uk_UA']['CHARSET'] = 'koi8-u';
1802 $languages['uk']['ALIAS'] = 'uk_UA';
1804 $languages['cy_GB']['NAME'] = 'Welsh';
1805 $languages['cy_GB']['CHARSET'] = 'iso-8859-1';
1806 $languages['cy']['ALIAS'] = 'cy_GB';
1808 $languages['vi_VN']['NAME'] = 'Vietnamese';
1809 $languages['vi_VN']['CHARSET'] = 'utf-8';
1810 $languages['vi']['ALIAS'] = 'vi_VN';
1812 // Right to left languages
1814 $languages['ar']['NAME'] = 'Arabic';
1815 $languages['ar']['CHARSET'] = 'windows-1256';
1816 $languages['ar']['DIR'] = 'rtl';
1818 $languages['he_IL']['NAME'] = 'Hebrew';
1819 $languages['he_IL']['CHARSET'] = 'windows-1255';
1820 $languages['he_IL']['DIR'] = 'rtl';
1821 $languages['he']['ALIAS'] = 'he_IL';
1823 /* Detect whether gettext is installed. */
1825 if (function_exists('_')) {
1826 $gettext_flags +
= 1;
1828 if (function_exists('bindtextdomain')) {
1829 $gettext_flags +
= 2;
1831 if (function_exists('textdomain')) {
1832 $gettext_flags +
= 4;
1835 /* If gettext is fully loaded, cool */
1836 if ($gettext_flags == 7) {
1837 $use_gettext = true;
1839 /* If we can fake gettext, try that */
1840 elseif ($gettext_flags == 0) {
1841 $use_gettext = true;
1842 include_once(SM_PATH
. 'functions/gettext.php');
1844 /* Uh-ho. A weird install */
1845 if (! $gettext_flags & 1) {
1850 if (! $gettext_flags & 2) {
1851 function bindtextdomain() {
1855 if (! $gettext_flags & 4) {
1856 function textdomain() {
1862 function charset_decode_utf8 ($string) {
1864 Every decoded character consists of n bytes. First byte is octal
1865 300-375, other bytes - always octals 200-277.
1867 \a\b characters are decoded to html code octdec(a-300)*64 + octdec(b-200)
1868 \a\b\c characters are decoded to html code octdec(a-340)*64*64 + octdec(b-200)*64 + octdec(c-200)
1870 decoding cycle is unfinished. please test and report problems to tokul@users.sourceforge.net
1872 global $default_charset, $languages, $sm_notAlias;
1874 if (strtolower($default_charset) == 'utf-8')
1876 if (strtolower($languages[$sm_notAlias]['CHARSET']) == 'utf-8')
1879 /* Only do the slow convert if there are 8-bit characters */
1880 if (! ereg("[\200-\377]", $string))
1883 // decode three byte unicode characters
1884 $string = preg_replace("/([\340-\357])([\200-\277])([\200-\277])/e",
1885 "'&#'.((ord('\\1')-224)*4096+(ord('\\2')-128)*64+(ord('\\3')-128)).';'",
1888 // decode two byte unicode characters
1889 $string = preg_replace("/([\300-\337])([\200-\277])/e",
1890 "'&#'.((ord('\\1')-192)*64+(ord('\\2')-128)).';'",
1897 * Japanese charset extra function
1900 function japanese_charset_xtra() {
1901 $ret = func_get_arg(1); /* default return value */
1902 if (function_exists('mb_detect_encoding')) {
1903 switch (func_get_arg(0)) { /* action */
1905 $detect_encoding = @mb_detect_encoding
($ret);
1906 if ($detect_encoding == 'JIS' ||
1907 $detect_encoding == 'EUC-JP' ||
1908 $detect_encoding == 'SJIS' ||
1909 $detect_encoding == 'UTF-8') {
1911 $ret = mb_convert_kana(mb_convert_encoding($ret, 'EUC-JP', 'AUTO'), "KV");
1915 $detect_encoding = @mb_detect_encoding
($ret);
1916 if ($detect_encoding == 'JIS' ||
1917 $detect_encoding == 'EUC-JP' ||
1918 $detect_encoding == 'SJIS' ||
1919 $detect_encoding == 'UTF-8') {
1921 $ret = mb_convert_encoding(mb_convert_kana($ret, "KV"), 'JIS', 'AUTO');
1925 $width = func_get_arg(2);
1926 $ret = mb_strimwidth($ret, 0, $width, '...');
1928 case 'encodeheader':
1930 if (strlen($ret) > 0) {
1931 $tmpstr = mb_substr($ret, 0, 1);
1932 $prevcsize = strlen($tmpstr);
1933 for ($i = 1; $i < mb_strlen($ret); $i++
) {
1934 $tmp = mb_substr($ret, $i, 1);
1935 if (strlen($tmp) == $prevcsize) {
1938 if ($prevcsize == 1) {
1941 $result .= str_replace(' ', '',
1942 mb_encode_mimeheader($tmpstr,'iso-2022-jp','B',''));
1945 $prevcsize = strlen($tmp);
1948 if (strlen($tmpstr)) {
1949 if (strlen(mb_substr($tmpstr, 0, 1)) == 1)
1952 $result .= str_replace(' ', '',
1953 mb_encode_mimeheader($tmpstr,'iso-2022-jp','B',''));
1958 case 'decodeheader':
1959 $ret = str_replace("\t", "", $ret);
1960 if (eregi('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=', $ret))
1961 $ret = @mb_decode_mimeheader
($ret);
1962 $ret = @mb_convert_encoding
($ret, 'EUC-JP', 'AUTO');
1964 case 'downloadfilename':
1965 $useragent = func_get_arg(2);
1966 if (strstr($useragent, 'Windows') !== false ||
1967 strstr($useragent, 'Mac_') !== false) {
1968 $ret = mb_convert_encoding($ret, 'SJIS', 'AUTO');
1970 $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
1974 $no_begin = "\x21\x25\x29\x2c\x2e\x3a\x3b\x3f\x5d\x7d\xa1\xf1\xa1\xeb\xa1" .
1975 "\xc7\xa1\xc9\xa2\xf3\xa1\xec\xa1\xed\xa1\xee\xa1\xa2\xa1\xa3\xa1\xb9" .
1976 "\xa1\xd3\xa1\xd5\xa1\xd7\xa1\xd9\xa1\xdb\xa1\xcd\xa4\xa1\xa4\xa3\xa4" .
1977 "\xa5\xa4\xa7\xa4\xa9\xa4\xc3\xa4\xe3\xa4\xe5\xa4\xe7\xa4\xee\xa1\xab" .
1978 "\xa1\xac\xa1\xb5\xa1\xb6\xa5\xa1\xa5\xa3\xa5\xa5\xa5\xa7\xa5\xa9\xa5" .
1979 "\xc3\xa5\xe3\xa5\xe5\xa5\xe7\xa5\xee\xa5\xf5\xa5\xf6\xa1\xa6\xa1\xbc" .
1980 "\xa1\xb3\xa1\xb4\xa1\xaa\xa1\xf3\xa1\xcb\xa1\xa4\xa1\xa5\xa1\xa7\xa1" .
1981 "\xa8\xa1\xa9\xa1\xcf\xa1\xd1";
1982 $no_end = "\x5c\x24\x28\x5b\x7b\xa1\xf2\x5c\xa1\xc6\xa1\xc8\xa1\xd2\xa1" .
1983 "\xd4\xa1\xd6\xa1\xd8\xa1\xda\xa1\xcc\xa1\xf0\xa1\xca\xa1\xce\xa1\xd0\xa1\xef";
1984 $wrap = func_get_arg(2);
1986 if (strlen($ret) >= $wrap &&
1987 substr($ret, 0, 1) != '>' &&
1988 strpos($ret, 'http://') === FALSE &&
1989 strpos($ret, 'https://') === FALSE &&
1990 strpos($ret, 'ftp://') === FALSE) {
1992 $ret = mb_convert_kana($ret, "KV");
1997 while ($ptr < strlen($ret) - 1) {
1998 $l = mb_strcut($ret, $ptr, $wrap);
2002 $l = mb_strcut($ret, $ptr, 2);
2003 while (strlen($l) != 0 && mb_strpos($no_begin, $l) !== FALSE ) {
2006 $l = mb_strcut($ret, $ptr, 1);
2009 if ($ptr < strlen($ret) - 1)
2015 case 'utf7-imap_encode':
2016 $ret = mb_convert_encoding($ret, 'UTF7-IMAP', 'EUC-JP');
2018 case 'utf7-imap_decode':
2019 $ret = mb_convert_encoding($ret, 'EUC-JP', 'UTF7-IMAP');
2028 * Korean charset extra function
2029 * Hangul(Korean Character) Attached File Name Fix.
2031 function korean_charset_xtra() {
2033 $ret = func_get_arg(1); /* default return value */
2034 if (func_get_arg(0) == 'downloadfilename') { /* action */
2035 $ret = str_replace("\x0D\x0A", '', $ret); /* Hanmail's CR/LF Clear */
2036 for ($i=0;$i<strlen($ret);$i++
) {
2037 if ($ret[$i] >= "\xA1" && $ret[$i] <= "\xFE") { /* 0xA1 - 0XFE are Valid */
2040 } else if (($ret[$i] >= 'a' && $ret[$i] <= 'z') ||
/* From Original ereg_replace in download.php */
2041 ($ret[$i] >= 'A' && $ret[$i] <= 'Z') ||
2042 ($ret[$i] == '.') ||
($ret[$i] == '-')) {