6 ** This file contains variuos functions that are needed to do
7 ** internationalization of SquirrelMail.
9 ** Internally iso-8859-1 is used as character set. Other characters
10 ** are encoded using Unicode entities according to HTML 4.0.
16 // This array specifies the available languages.
17 $languages[0]["NAME"] = "English";
18 $languages[0]["CODE"] = "en";
19 $languages[1]["NAME"] = "Norsk";
20 $languages[1]["CODE"] = "no";
21 $languages[2]["NAME"] = "Deutcsh";
22 $languages[2]["CODE"] = "de";
23 $languages[2]["NAME"] = "Russian KOI8-R";
24 $languages[2]["CODE"] = "ru";
26 // Decodes a string to the internal encoding from the given charset
27 function charset_decode ($charset, $string) {
28 // All HTML special characters are 7 bit and can be replaced first
29 $string = htmlspecialchars ($string);
31 $charset = strtolower($charset);
33 if (ereg("iso-8859-(.*)", $charset, $res)) {
35 return charset_decode_iso_8859_1 ($string);
37 return charset_decode_iso_8859_7 ($string);
38 else if ($res[1] == "15")
39 return charset_decode_iso_8859_15 ($string);
41 return charset_decode_iso_8859_default ($string);
42 } else if ($charset == "ns_4551-1") {
43 return charset_decode_ns_4551_1 ($string);
44 } else if ($charset == "koi8-r") {
45 return charset_decode_koi8r ($string);
50 // iso-8859-1 is the same as Latin 1 and is normally used
52 function charset_decode_iso_8859_1 ($string) {
53 // This is only debug code as long as the internal
54 // character set is iso-8859-1
56 // Latin small letter o with stroke
57 $string = str_replace ("\370", "ø", $string);
62 // iso-8859-7 is Greek.
63 function charset_decode_iso_8859_7 ($string) {
64 // Could not find Unicode equivalent of 0xA1 and 0xA2
65 // 0xA4, 0xA5, 0xAA, 0xAE, 0xD2 and 0xFF should not be used
66 $string = strtr($string, "\241\242\244\245\252\256\322\377",
69 // Horizontal bar (parentheki pavla)
70 while (ereg("\257", $string))
71 $string = str_replace ("\257", "―", $string);
73 // ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6)
74 // These are Unicode 900-902
75 while (ereg("([\264-\266])", $string, $res)) {
76 $replace = "&#" . (ord($res[1])+
720) . ";";
77 $string = str_replace($res[1], $replace, $string);
80 // 11/07 (0xB7) Middle dot is the same in iso-8859-1
82 // ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA)
83 // These are Unicode 900-902
84 while (ereg("([\270-\272])", $string, $res)) {
85 $replace = "&#" . (ord($res[1])+
720) . ";";
86 $string = str_replace($res[1], $replace, $string);
89 // 11/11 (0xBB) Right angle quotation mark is the same as in
92 // And now the rest of the charset
93 while (ereg("([\273-\376])", $string, $res)) {
94 $replace = "&#" . (ord($res[1])+
720) . ";";
95 $string = str_replace($res[1], $replace, $string);
101 // iso-8859-15 is Latin 15 and has very much the same use as Latin 1
102 // but has the Euro symbol and some characters needed for French.
103 function charset_decode_iso_8859_15 ($string) {
105 $string = str_replace ("\244", "€", $string);
106 // Latin capital letter S with caron
107 $string = str_replace ("\244", "Š", $string);
108 // Latin small letter s with caron
109 $string = str_replace ("\250", "š", $string);
110 // Latin capital letter Z with caron
111 $string = str_replace ("\264", "Ž", $string);
112 // Latin small letter z with caron
113 $string = str_replace ("\270", "ž", $string);
114 // Latin capital ligature OE
115 $string = str_replace ("\274", "Œ", $string);
116 // Latin small ligature oe
117 $string = str_replace ("\275", "œ", $string);
118 // Latin capital letter Y with diaeresis
119 $string = str_replace ("\276", "Ÿ", $string);
124 // ISO-8859-15 is Cyrillic
125 function charset_decode_iso_8859_5 ($string) {
126 // Convert to KOI8-R, then return this decoded.
127 $string = convert_cyr_string($string, "i", "k");
128 return charset_decode_koi8r($string);
131 // Remove all 8 bit characters from all other ISO-8859 character sets
132 function charset_decode_iso_8859_default ($string) {
133 return (strtr($string, "\240\241\242\243\244\245\246\247".
134 "\250\251\252\253\254\255\256\257".
135 "\260\261\262\263\264\265\266\267".
136 "\270\271\272\273\274\275\276\277".
137 "\300\301\302\303\304\305\306\307".
138 "\310\311\312\313\314\315\316\317".
139 "\320\321\322\323\324\325\326\327".
140 "\330\331\332\333\334\335\336\337".
141 "\340\341\342\343\344\345\346\347".
142 "\350\351\352\353\354\355\356\357".
143 "\360\361\362\363\364\365\366\367".
144 "\370\371\372\373\374\375\376\377",
145 "????????????????????????????????????????".
146 "????????????????????????????????????????".
147 "????????????????????????????????????????".
152 // This is the same as ISO-646-NO and is used by some
153 // Microsoft programs when sending Norwegian characters
154 function charset_decode_ns_4551_1 ($string) {
155 // These characters are:
156 // Latin capital letter AE
157 // Latin capital letter O with stroke
158 // Latin capital letter A with ring above
159 // and the same as small letters
160 return strtr ($string, "[\\]{|}", "ÆØÅæøå");
163 // KOI8-R is used to encode Russian mail (Cyrrilic). Defined in RFC
165 function charset_decode_koi8r ($string) {
166 global $default_charset;
168 if ($default_charset == "koi8-r") {
171 // Convert to Unicode HTML entities.
172 // This code is rather ineffective.
173 $string = str_replace("\200", "─", $string);
174 $string = str_replace("\201", "│", $string);
175 $string = str_replace("\202", "┌", $string);
176 $string = str_replace("\203", "┐", $string);
177 $string = str_replace("\204", "└", $string);
178 $string = str_replace("\205", "┘", $string);
179 $string = str_replace("\206", "├", $string);
180 $string = str_replace("\207", "┤", $string);
181 $string = str_replace("\210", "┬", $string);
182 $string = str_replace("\211", "┴", $string);
183 $string = str_replace("\212", "┼", $string);
184 $string = str_replace("\213", "▀", $string);
185 $string = str_replace("\214", "▄", $string);
186 $string = str_replace("\215", "█", $string);
187 $string = str_replace("\216", "▌", $string);
188 $string = str_replace("\217", "▐", $string);
189 $string = str_replace("\220", "░", $string);
190 $string = str_replace("\221", "▒", $string);
191 $string = str_replace("\222", "▓", $string);
192 $string = str_replace("\223", "⌠", $string);
193 $string = str_replace("\224", "■", $string);
194 $string = str_replace("\225", "∙", $string);
195 $string = str_replace("\226", "√", $string);
196 $string = str_replace("\227", "≈", $string);
197 $string = str_replace("\230", "≤", $string);
198 $string = str_replace("\231", "≥", $string);
199 $string = str_replace("\232", " ", $string);
200 $string = str_replace("\233", "⌡", $string);
201 $string = str_replace("\234", "°", $string);
202 $string = str_replace("\235", "²", $string);
203 $string = str_replace("\236", "·", $string);
204 $string = str_replace("\237", "÷", $string);
205 $string = str_replace("\240", "═", $string);
206 $string = str_replace("\241", "║", $string);
207 $string = str_replace("\242", "╒", $string);
208 $string = str_replace("\243", "ё", $string);
209 $string = str_replace("\244", "╓", $string);
210 $string = str_replace("\245", "╔", $string);
211 $string = str_replace("\246", "╕", $string);
212 $string = str_replace("\247", "╖", $string);
213 $string = str_replace("\250", "╗", $string);
214 $string = str_replace("\251", "╘", $string);
215 $string = str_replace("\252", "╙", $string);
216 $string = str_replace("\253", "╚", $string);
217 $string = str_replace("\254", "╛", $string);
218 $string = str_replace("\255", "╜", $string);
219 $string = str_replace("\256", "╝", $string);
220 $string = str_replace("\257", "╞", $string);
221 $string = str_replace("\260", "╟", $string);
222 $string = str_replace("\261", "╠", $string);
223 $string = str_replace("\262", "╡", $string);
224 $string = str_replace("\263", "Ё", $string);
225 $string = str_replace("\264", "╢", $string);
226 $string = str_replace("\265", "╣", $string);
227 $string = str_replace("\266", "╤", $string);
228 $string = str_replace("\267", "╥", $string);
229 $string = str_replace("\270", "╦", $string);
230 $string = str_replace("\271", "╧", $string);
231 $string = str_replace("\272", "╨", $string);
232 $string = str_replace("\273", "╩", $string);
233 $string = str_replace("\274", "╪", $string);
234 $string = str_replace("\275", "╫", $string);
235 $string = str_replace("\276", "╬", $string);
236 $string = str_replace("\277", "©", $string);
237 $string = str_replace("\300", "ю", $string);
238 $string = str_replace("\301", "а", $string);
239 $string = str_replace("\302", "б", $string);
240 $string = str_replace("\303", "ц", $string);
241 $string = str_replace("\304", "д", $string);
242 $string = str_replace("\305", "е", $string);
243 $string = str_replace("\306", "ф", $string);
244 $string = str_replace("\307", "г", $string);
245 $string = str_replace("\310", "х", $string);
246 $string = str_replace("\311", "и", $string);
247 $string = str_replace("\312", "й", $string);
248 $string = str_replace("\313", "к", $string);
249 $string = str_replace("\314", "л", $string);
250 $string = str_replace("\315", "м", $string);
251 $string = str_replace("\316", "н", $string);
252 $string = str_replace("\317", "о", $string);
253 $string = str_replace("\320", "п", $string);
254 $string = str_replace("\321", "я", $string);
255 $string = str_replace("\322", "р", $string);
256 $string = str_replace("\323", "с", $string);
257 $string = str_replace("\324", "т", $string);
258 $string = str_replace("\325", "у", $string);
259 $string = str_replace("\326", "ж", $string);
260 $string = str_replace("\327", "в", $string);
261 $string = str_replace("\330", "ь", $string);
262 $string = str_replace("\331", "ы", $string);
263 $string = str_replace("\332", "з", $string);
264 $string = str_replace("\333", "ш", $string);
265 $string = str_replace("\334", "э", $string);
266 $string = str_replace("\335", "щ", $string);
267 $string = str_replace("\336", "ч", $string);
268 $string = str_replace("\337", "ъ", $string);
269 $string = str_replace("\340", "Ю", $string);
270 $string = str_replace("\341", "А", $string);
271 $string = str_replace("\342", "Б", $string);
272 $string = str_replace("\343", "Ц", $string);
273 $string = str_replace("\344", "Д", $string);
274 $string = str_replace("\345", "Е", $string);
275 $string = str_replace("\346", "Ф", $string);
276 $string = str_replace("\347", "Г", $string);
277 $string = str_replace("\350", "Х", $string);
278 $string = str_replace("\351", "И", $string);
279 $string = str_replace("\352", "Й", $string);
280 $string = str_replace("\353", "К", $string);
281 $string = str_replace("\354", "Л", $string);
282 $string = str_replace("\355", "М", $string);
283 $string = str_replace("\356", "Н", $string);
284 $string = str_replace("\357", "О", $string);
285 $string = str_replace("\360", "П", $string);
286 $string = str_replace("\361", "Я", $string);
287 $string = str_replace("\362", "Р", $string);
288 $string = str_replace("\363", "С", $string);
289 $string = str_replace("\364", "Т", $string);
290 $string = str_replace("\365", "У", $string);
291 $string = str_replace("\366", "Ж", $string);
292 $string = str_replace("\367", "В", $string);
293 $string = str_replace("\370", "Ь", $string);
294 $string = str_replace("\371", "Ы", $string);
295 $string = str_replace("\372", "З", $string);
296 $string = str_replace("\373", "Ш", $string);
297 $string = str_replace("\374", "Э", $string);
298 $string = str_replace("\375", "Щ", $string);
299 $string = str_replace("\376", "Ч", $string);
300 $string = str_replace("\377", "Ъ", $string);