Added full character translation tables for ISO-8859-1, 7 and 15.
[squirrelmail.git] / functions / i18n.php
CommitLineData
1fd97780 1<?
2
3/**
4 ** i18n.php
5 **
6 ** This file contains variuos functions that are needed to do
7 ** internationalization of SquirrelMail.
8 **
9 ** Internally iso-8859-1 is used as character set. Other characters
10 ** are encoded using Unicode entities according to HTML 4.0.
173ed887 11 **
1fd97780 12 **/
13
14 $i18n_php = true;
15
d30d79f2 16 // This array specifies the available languages.
17 $languages[0]["NAME"] = "English";
18 $languages[0]["CODE"] = "en";
19 $languages[1]["NAME"] = "Norsk";
20 $languages[1]["CODE"] = "no";
907762bb 21 $languages[2]["NAME"] = "Deutcsh";
22 $languages[2]["CODE"] = "de";
e4ff0781 23 $languages[2]["NAME"] = "Russian KOI8-R";
24 $languages[2]["CODE"] = "ru";
d30d79f2 25
1fd97780 26 // Decodes a string to the internal encoding from the given charset
27 function charset_decode ($charset, $string) {
28 // All HTML special characters are 7 bit and can be replaced first
29 $string = htmlspecialchars ($string);
30
44139266 31 $charset = strtolower($charset);
1fd97780 32
33 if (ereg("iso-8859-(.*)", $charset, $res)) {
34 if ($res[1] == "1")
35 return charset_decode_iso_8859_1 ($string);
173ed887 36 if ($res[1] == "7")
37 return charset_decode_iso_8859_7 ($string);
1fd97780 38 else if ($res[1] == "15")
39 return charset_decode_iso_8859_15 ($string);
40 else
41 return charset_decode_iso_8859_default ($string);
42 } else if ($charset == "ns_4551-1") {
43 return charset_decode_ns_4551_1 ($string);
17ce8467 44 } else if ($charset == "koi8-r") {
45 return charset_decode_koi8r ($string);
209e2f82 46 } else
04563822 47 return "xx$charset:$string";
1fd97780 48 }
49
50 // iso-8859-1 is the same as Latin 1 and is normally used
51 // in western europe.
52 function charset_decode_iso_8859_1 ($string) {
04563822 53 global $default_charset;
1fd97780 54
04563822 55 if (strtolower($default_charset) == "iso-8859-1") {
56 return $string;
57 } else {
58 // Only do the slow convert if there are 8-bit characters
59 if (ereg("[\200-\377]", $string)) {
60 $string = str_replace("\201", "&#129;", $string);
61 $string = str_replace("\202", "&#130;", $string);
62 $string = str_replace("\203", "&#131;", $string);
63 $string = str_replace("\204", "&#132;", $string);
64 $string = str_replace("\205", "&#133;", $string);
65 $string = str_replace("\206", "&#134;", $string);
66 $string = str_replace("\207", "&#135;", $string);
67 $string = str_replace("\210", "&#136;", $string);
68 $string = str_replace("\211", "&#137;", $string);
69 $string = str_replace("\212", "&#138;", $string);
70 $string = str_replace("\213", "&#139;", $string);
71 $string = str_replace("\214", "&#140;", $string);
72 $string = str_replace("\215", "&#141;", $string);
73 $string = str_replace("\216", "&#142;", $string);
74 $string = str_replace("\217", "&#143;", $string);
75 $string = str_replace("\220", "&#144;", $string);
76 $string = str_replace("\221", "&#145;", $string);
77 $string = str_replace("\222", "&#146;", $string);
78 $string = str_replace("\223", "&#147;", $string);
79 $string = str_replace("\224", "&#148;", $string);
80 $string = str_replace("\225", "&#149;", $string);
81 $string = str_replace("\226", "&#150;", $string);
82 $string = str_replace("\227", "&#151;", $string);
83 $string = str_replace("\230", "&#152;", $string);
84 $string = str_replace("\231", "&#153;", $string);
85 $string = str_replace("\232", "&#154;", $string);
86 $string = str_replace("\233", "&#155;", $string);
87 $string = str_replace("\234", "&#156;", $string);
88 $string = str_replace("\235", "&#157;", $string);
89 $string = str_replace("\236", "&#158;", $string);
90 $string = str_replace("\237", "&#159;", $string);
91 $string = str_replace("\240", "&#160;", $string);
92 $string = str_replace("\241", "&#161;", $string);
93 $string = str_replace("\242", "&#162;", $string);
94 $string = str_replace("\243", "&#163;", $string);
95 $string = str_replace("\244", "&#164;", $string);
96 $string = str_replace("\245", "&#165;", $string);
97 $string = str_replace("\246", "&#166;", $string);
98 $string = str_replace("\247", "&#167;", $string);
99 $string = str_replace("\250", "&#168;", $string);
100 $string = str_replace("\251", "&#169;", $string);
101 $string = str_replace("\252", "&#170;", $string);
102 $string = str_replace("\253", "&#171;", $string);
103 $string = str_replace("\254", "&#172;", $string);
104 $string = str_replace("\255", "&#173;", $string);
105 $string = str_replace("\256", "&#174;", $string);
106 $string = str_replace("\257", "&#175;", $string);
107 $string = str_replace("\260", "&#176;", $string);
108 $string = str_replace("\261", "&#177;", $string);
109 $string = str_replace("\262", "&#178;", $string);
110 $string = str_replace("\263", "&#179;", $string);
111 $string = str_replace("\264", "&#180;", $string);
112 $string = str_replace("\265", "&#181;", $string);
113 $string = str_replace("\266", "&#182;", $string);
114 $string = str_replace("\267", "&#183;", $string);
115 $string = str_replace("\270", "&#184;", $string);
116 $string = str_replace("\271", "&#185;", $string);
117 $string = str_replace("\272", "&#186;", $string);
118 $string = str_replace("\273", "&#187;", $string);
119 $string = str_replace("\274", "&#188;", $string);
120 $string = str_replace("\275", "&#189;", $string);
121 $string = str_replace("\276", "&#190;", $string);
122 $string = str_replace("\277", "&#191;", $string);
123 $string = str_replace("\300", "&#192;", $string);
124 $string = str_replace("\301", "&#193;", $string);
125 $string = str_replace("\302", "&#194;", $string);
126 $string = str_replace("\303", "&#195;", $string);
127 $string = str_replace("\304", "&#196;", $string);
128 $string = str_replace("\305", "&#197;", $string);
129 $string = str_replace("\306", "&#198;", $string);
130 $string = str_replace("\307", "&#199;", $string);
131 $string = str_replace("\310", "&#200;", $string);
132 $string = str_replace("\311", "&#201;", $string);
133 $string = str_replace("\312", "&#202;", $string);
134 $string = str_replace("\313", "&#203;", $string);
135 $string = str_replace("\314", "&#204;", $string);
136 $string = str_replace("\315", "&#205;", $string);
137 $string = str_replace("\316", "&#206;", $string);
138 $string = str_replace("\317", "&#207;", $string);
139 $string = str_replace("\320", "&#208;", $string);
140 $string = str_replace("\321", "&#209;", $string);
141 $string = str_replace("\322", "&#210;", $string);
142 $string = str_replace("\323", "&#211;", $string);
143 $string = str_replace("\324", "&#212;", $string);
144 $string = str_replace("\325", "&#213;", $string);
145 $string = str_replace("\326", "&#214;", $string);
146 $string = str_replace("\327", "&#215;", $string);
147 $string = str_replace("\330", "&#216;", $string);
148 $string = str_replace("\331", "&#217;", $string);
149 $string = str_replace("\332", "&#218;", $string);
150 $string = str_replace("\333", "&#219;", $string);
151 $string = str_replace("\334", "&#220;", $string);
152 $string = str_replace("\335", "&#221;", $string);
153 $string = str_replace("\336", "&#222;", $string);
154 $string = str_replace("\337", "&#223;", $string);
155 $string = str_replace("\340", "&#224;", $string);
156 $string = str_replace("\341", "&#225;", $string);
157 $string = str_replace("\342", "&#226;", $string);
158 $string = str_replace("\343", "&#227;", $string);
159 $string = str_replace("\344", "&#228;", $string);
160 $string = str_replace("\345", "&#229;", $string);
161 $string = str_replace("\346", "&#230;", $string);
162 $string = str_replace("\347", "&#231;", $string);
163 $string = str_replace("\350", "&#232;", $string);
164 $string = str_replace("\351", "&#233;", $string);
165 $string = str_replace("\352", "&#234;", $string);
166 $string = str_replace("\353", "&#235;", $string);
167 $string = str_replace("\354", "&#236;", $string);
168 $string = str_replace("\355", "&#237;", $string);
169 $string = str_replace("\356", "&#238;", $string);
170 $string = str_replace("\357", "&#239;", $string);
171 $string = str_replace("\360", "&#240;", $string);
172 $string = str_replace("\361", "&#241;", $string);
173 $string = str_replace("\362", "&#242;", $string);
174 $string = str_replace("\363", "&#243;", $string);
175 $string = str_replace("\364", "&#244;", $string);
176 $string = str_replace("\365", "&#245;", $string);
177 $string = str_replace("\366", "&#246;", $string);
178 $string = str_replace("\367", "&#247;", $string);
179 $string = str_replace("\370", "&#248;", $string);
180 $string = str_replace("\371", "&#249;", $string);
181 $string = str_replace("\372", "&#250;", $string);
182 $string = str_replace("\373", "&#251;", $string);
183 $string = str_replace("\374", "&#252;", $string);
184 $string = str_replace("\375", "&#253;", $string);
185 $string = str_replace("\376", "&#254;", $string);
186 $string = str_replace("\377", "&#255;", $string);
187 }
188 }
1fd97780 189
190 return ($string);
191 }
192
0a86e9f3 193 // iso-8859-7 is Greek.
209e2f82 194 function charset_decode_iso_8859_7 ($string) {
04563822 195 global $default_charset;
173ed887 196
04563822 197 if (strtolower($default_charset) == "iso-8859-7") {
198 return $string;
199 } else {
200 // Only do the slow convert if there are 8-bit characters
201 if (ereg("[\200-\377]", $string)) {
202 // Some diverse characters in the beginning
203 $string = str_replace("\240", "&#160;", $string);
204 $string = str_replace("\241", "&#8216;", $string);
205 $string = str_replace("\242", "&#8217;", $string);
206 $string = str_replace("\243", "&#163;", $string);
207 $string = str_replace("\246", "&#166;", $string);
208 $string = str_replace("\247", "&#167;", $string);
209 $string = str_replace("\250", "&#168;", $string);
210 $string = str_replace("\251", "&#169;", $string);
211 $string = str_replace("\253", "&#171;", $string);
212 $string = str_replace("\254", "&#172;", $string);
213 $string = str_replace("\255", "&#173;", $string);
214 $string = str_replace("\257", "&#8213;", $string);
215 $string = str_replace("\260", "&#176;", $string);
216 $string = str_replace("\261", "&#177;", $string);
217 $string = str_replace("\262", "&#178;", $string);
218 $string = str_replace("\263", "&#179;", $string);
219
220 // Horizontal bar (parentheki pavla)
221 $string = str_replace ("\257", "&#8213;", $string);
222
223 // ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6)
224 // These are Unicode 900-902
225 while (ereg("([\264-\266])", $string, $res)) {
226 $replace = "&#" . (ord($res[1])+720) . ";";
227 $string = str_replace($res[1], $replace, $string);
228 }
229
230 // 11/07 (0xB7) Middle dot is the same in iso-8859-1
231 $string = str_replace("\267", "&#183;", $string);
232
233 // ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA)
234 // These are Unicode 900-902
235 while (ereg("([\270-\272])", $string, $res)) {
236 $replace = "&#" . (ord($res[1])+720) . ";";
237 $string = str_replace($res[1], $replace, $string);
238 }
239
240 // 11/11 (0xBB) Right angle quotation mark is the same as in
241 // iso-8859-1
242 $string = str_replace("\273", "&#187;", $string);
243
244 // And now the rest of the charset
245 while (ereg("([\274-\376])", $string, $res)) {
246 $replace = "&#" . (ord($res[1])+720) . ";";
247 $string = str_replace($res[1], $replace, $string);
248 }
249 }
173ed887 250 }
251
252 return $string;
253 }
254
1fd97780 255 // iso-8859-15 is Latin 15 and has very much the same use as Latin 1
256 // but has the Euro symbol and some characters needed for French.
257 function charset_decode_iso_8859_15 ($string) {
258 // Euro sign
d23e472b 259 $string = str_replace ("\244", "&#8364;", $string);
1fd97780 260 // Latin capital letter S with caron
d23e472b 261 $string = str_replace ("\244", "&#352;", $string);
1fd97780 262 // Latin small letter s with caron
d23e472b 263 $string = str_replace ("\250", "&#353;", $string);
1fd97780 264 // Latin capital letter Z with caron
d23e472b 265 $string = str_replace ("\264", "&#381;", $string);
1fd97780 266 // Latin small letter z with caron
d23e472b 267 $string = str_replace ("\270", "&#382;", $string);
1fd97780 268 // Latin capital ligature OE
d23e472b 269 $string = str_replace ("\274", "&#338;", $string);
1fd97780 270 // Latin small ligature oe
d23e472b 271 $string = str_replace ("\275", "&#339;", $string);
1fd97780 272 // Latin capital letter Y with diaeresis
d23e472b 273 $string = str_replace ("\276", "&#376;", $string);
1fd97780 274
04563822 275 return (charset_decode_iso_8859_1($string));
1fd97780 276 }
277
17ce8467 278 // ISO-8859-15 is Cyrillic
279 function charset_decode_iso_8859_5 ($string) {
d23e472b 280 // Convert to KOI8-R, then return this decoded.
281 $string = convert_cyr_string($string, "i", "k");
282 return charset_decode_koi8r($string);
17ce8467 283 }
284
173ed887 285 // Remove all 8 bit characters from all other ISO-8859 character sets
1fd97780 286 function charset_decode_iso_8859_default ($string) {
287 return (strtr($string, "\240\241\242\243\244\245\246\247".
288 "\250\251\252\253\254\255\256\257".
289 "\260\261\262\263\264\265\266\267".
290 "\270\271\272\273\274\275\276\277".
291 "\300\301\302\303\304\305\306\307".
292 "\310\311\312\313\314\315\316\317".
293 "\320\321\322\323\324\325\326\327".
294 "\330\331\332\333\334\335\336\337".
295 "\340\341\342\343\344\345\346\347".
296 "\350\351\352\353\354\355\356\357".
297 "\360\361\362\363\364\365\366\367".
298 "\370\371\372\373\374\375\376\377",
299 "????????????????????????????????????????".
300 "????????????????????????????????????????".
301 "????????????????????????????????????????".
302 "????????"));
303
304 }
305
306 // This is the same as ISO-646-NO and is used by some
307 // Microsoft programs when sending Norwegian characters
308 function charset_decode_ns_4551_1 ($string) {
309 // These characters are:
310 // Latin capital letter AE
311 // Latin capital letter O with stroke
312 // Latin capital letter A with ring above
313 // and the same as small letters
314