6a4e9fe8426645cdcda2c8643f5af089af8d34fc
6 * Copyright (c) 1999-2002 The SquirrelMail Project Team
7 * Licensed under the GNU GPL. For full terms see the file COPYING.
9 * This contains the functions necessary to detect and decode MIME
15 require_once('../functions/imap.php');
16 require_once('../functions/attachment_common.php');
18 /** Setting up the objects that have the structure for the message **/
20 /** msg_header contains generic variables for values that **/
21 /** could be in a header. **/
23 var $type0 = '', $type1 = '', $boundary = '', $charset = '',
24 $encoding = '', $size = 0, $to = array(), $from = '', $date = '',
25 $cc = array(), $bcc = array(), $reply_to = '', $subject = '',
26 $id = 0, $mailbox = '', $description = '', $filename = '',
27 $entity_id = 0, $message_id = 0, $name = '', $priority = 3;
31 /** message is the object that contains messages. It is a recursive
32 object in that through the $entities variable, it can contain
33 more objects of type message. See documentation in mime.txt for
34 a better description of how this works.
37 var $entities = array();
39 function addEntity ($msg) {
40 $this->entities
[] = $msg;
44 /* --------------------------------------------------------------------------------- */
46 /* --------------------------------------------------------------------------------- */
48 /* This function gets the structure of a message and stores it in the "message" class.
49 * It will return this object for use with all relevant header information and
50 * fully parsed into the standard "message" object format.
52 function mime_structure ($imap_stream, $header) {
54 sqimap_messages_flag ($imap_stream, $header->id
, $header->id
, 'Seen');
55 $ssid = sqimap_session_id();
56 $lsid = strlen( $ssid );
58 fputs ($imap_stream, "$ssid FETCH $id BODYSTRUCTURE\r\n");
60 // This should use sqimap_read_data instead of reading it itself
62 $read = fgets ($imap_stream, 10000);
64 while ( substr($read, 0, $lsid) <> $ssid &&
65 !feof( $imap_stream ) ) {
66 $bodystructure .= $read;
67 $read = fgets ($imap_stream, 10000);
69 $read = $bodystructure;
71 // isolate the body structure and remove beginning and end parenthesis
72 $read = trim(substr ($read, strpos(strtolower($read), 'bodystructure') +
13));
73 $read = trim(substr ($read, 0, -1));
74 $end = mime_match_parenthesis(0, $read);
75 while ($end == strlen($read)-1) {
76 $read = trim(substr ($read, 0, -1));
77 $read = trim(substr ($read, 1));
78 $end = mime_match_parenthesis(0, $read);
81 $msg = mime_parse_structure ($read, 0);
82 $msg->header
= $header;
87 /* this starts the parsing of a particular structure. It is called recursively,
88 * so it can be passed different structures. It returns an object of type
90 * First, it checks to see if it is a multipart message. If it is, then it
91 * handles that as it sees is necessary. If it is just a regular entity,
92 * then it parses it and adds the necessary header information (by calling out
93 * to mime_get_element()).
95 function mime_parse_structure ($structure, $ent_id) {
98 if ($structure{0} == '(') {
99 $ent_id = mime_new_element_level($ent_id);
103 $end = mime_match_parenthesis ($start, $structure);
105 $element = substr($structure, $start+
1, ($end - $start)-1);
106 $ent_id = mime_increment_id ($ent_id);
107 $newmsg = mime_parse_structure ($element, $ent_id);
108 $msg->addEntity ($newmsg);
109 } while ($structure{$end+
1} == '(');
111 // parse the elements
112 $msg = mime_get_element ($structure, $msg, $ent_id);
117 /* Increments the element ID. An element id can look like any of
118 * the following: 1, 1.2, 4.3.2.4.1, etc. This function increments
119 * the last number of the element id, changing 1.2 to 1.3.
121 function mime_increment_id ($id) {
123 if (strpos($id, ".")) {
124 $first = substr($id, 0, strrpos($id, "."));
125 $last = substr($id, strrpos($id, ".")+
1);
127 $new = $first . "." .$last;
136 * See comment for mime_increment_id().
137 * This adds another level on to the entity_id changing 1.3 to 1.3.0
138 * NOTE: 1.3.0 is not a valid element ID. It MUST be incremented
139 * before it can be used. I left it this way so as not to have
140 * to make a special case if it is the first entity_id. It
141 * always increments it, and that works fine.
143 function mime_new_element_level ($id) {
154 function mime_get_element (&$structure, $msg, $ent_id) {
157 $msg->header
= new msg_header();
158 $msg->header
->entity_id
= $ent_id;
159 $properties = array();
161 while (strlen($structure) > 0) {
162 $structure = trim($structure);
163 $char = $structure{0};
165 if (strtolower(substr($structure, 0, 3)) == 'nil') {
167 $structure = substr($structure, 3);
168 } else if ($char == '"') {
169 // loop through until we find the matching quote, and return that as a string
172 while ( ($char = $structure{$pos} ) <> '"' && $pos < strlen($structure)) {
176 $structure = substr($structure, strlen($text) +
2);
177 } else if ($char == '(') {
179 $end = mime_match_parenthesis (0, $structure);
180 $sub = substr($structure, 1, $end-1);
181 $properties = mime_get_props($properties, $sub);
182 $structure = substr($structure, strlen($sub) +
2);
184 // loop through until we find a space or an end parenthesis
186 $char = $structure{$pos};
188 while ($char != ' ' && $char != ')' && $pos < strlen($structure)) {
191 $char = $structure{$pos};
193 $structure = substr($structure, strlen($text));
196 // This is where all the text parts get put into the header
199 $msg->header
->type0
= strtolower($text);
202 $msg->header
->type1
= strtolower($text);
205 // Invisimail enclose images with <>
206 $msg->header
->id
= str_replace( '<', '', str_replace( '>', '', $text ) );
209 $msg->header
->description
= $text;
212 $msg->header
->encoding
= strtolower($text);
215 $msg->header
->size
= $text;
218 if ($msg->header
->type0
== 'text' && $elem_num == 8) {
219 // This is a plain text message, so lets get the number of lines
221 $msg->header
->num_lines
= $text;
223 } else if ($msg->header
->type0
== 'message' && $msg->header
->type1
== 'rfc822' && $elem_num == 8) {
224 // This is an encapsulated message, so lets start all over again and
225 // parse this message adding it on to the existing one.
226 $structure = trim($structure);
227 if ( $structure{0} == '(' ) {
228 $e = mime_match_parenthesis (0, $structure);
229 $structure = substr($structure, 0, $e);
230 $structure = substr($structure, 1);
231 $m = mime_parse_structure($structure, $msg->header
->entity_id
);
233 // the following conditional is there to correct a bug that wasn't
234 // incrementing the entity IDs correctly because of the special case
235 // that message/rfc822 is. This fixes it fine.
236 if (substr($structure, 1, 1) != '(')
237 $m->header
->entity_id
= mime_increment_id(mime_new_element_level($ent_id));
239 // Now we'll go through and reformat the results.
241 for ($i=0; $i < count($m->entities
); $i++
) {
242 $msg->addEntity($m->entities
[$i]);
255 // loop through the additional properties and put those in the various headers
256 if ($msg->header
->type0
!= 'message') {
257 for ($i=0; $i < count($properties); $i++
) {
258 $msg->header
->{$properties[$i]['name']} = $properties[$i]['value'];
266 * I did most of the MIME stuff yesterday (June 20, 2000), but I couldn't
267 * figure out how to do this part, so I decided to go to bed. I woke up
268 * in the morning and had a flash of insight. I went to the white-board
269 * and scribbled it out, then spent a bit programming it, and this is the
270 * result. Nothing complicated, but I think my brain was fried yesterday.
271 * Funny how that happens sometimes.
273 * This gets properties in a nested parenthesized list. For example,
274 * this would get passed something like: ("attachment" ("filename" "luke.tar.gz"))
275 * This returns an array called $props with all paired up properties.
276 * It ignores the "attachment" for now, maybe that should change later
277 * down the road. In this case, what is returned is:
278 * $props[0]["name"] = "filename";
279 * $props[0]["value"] = "luke.tar.gz";
281 function mime_get_props ($props, $structure) {
283 while (strlen($structure) > 0) {
284 $structure = trim($structure);
285 $char = $structure{0};
290 while ( ( $char = $structure{$pos} ) != '"' &&
291 $pos < strlen($structure)) {
295 $structure = trim(substr($structure, strlen($tmp) +
2));
296 $char = $structure{0};
301 while ( ( $char = $structure{$pos} ) != '"' &&
302 $pos < strlen($structure) ) {
306 $structure = trim(substr($structure, strlen($tmp) +
2));
309 $props[$k]['name'] = strtolower($tmp);
310 $props[$k]['value'] = $value;
311 } else if ($char == '(') {
312 $end = mime_match_parenthesis (0, $structure);
313 $sub = substr($structure, 1, $end-1);
316 $props = mime_get_props($props, $sub);
317 $structure = substr($structure, strlen($sub) +
2);
320 } else if ($char == '(') {
321 $end = mime_match_parenthesis (0, $structure);
322 $sub = substr($structure, 1, $end-1);
323 $props = mime_get_props($props, $sub);
324 $structure = substr($structure, strlen($sub) +
2);
333 * Matches parenthesis. It will return the position of the matching
334 * parenthesis in $structure. For instance, if $structure was:
335 * ("text" "plain" ("val1name", "1") nil ... )
337 * then this would return 42 to match up those two.
339 function mime_match_parenthesis ($pos, $structure) {
341 $j = strlen( $structure );
343 // ignore all extra characters
344 // If inside of a string, skip string -- Boundary IDs and other
345 // things can have ) in them.
346 if ( $structure{$pos} != '(' ) {
350 while ( $pos < $j ) {
352 if ($structure{$pos} == ')') {
354 } elseif ($structure{$pos} == '"') {
356 while ( $structure{$pos} != '"' &&
358 if (substr($structure, $pos, 2) == '\\"') {
360 } elseif (substr($structure, $pos, 2) == '\\\\') {
365 } elseif ( $structure{$pos} == '(' ) {
366 $pos = mime_match_parenthesis ($pos, $structure);
369 echo _("Error decoding mime structure. Report this as a bug!") . '<br>';
373 function mime_fetch_body ($imap_stream, $id, $ent_id ) {
376 * do a bit of error correction. If we couldn't find the entity id, just guess
377 * that it is the first one. That is usually the case anyway.
382 $data = sqimap_run_command ($imap_stream, "FETCH $id BODY[$ent_id]", true, $response, $message);
383 $topline = array_shift($data);
384 while (! ereg('\\* [0-9]+ FETCH ', $topline) && $data) {
385 $topline = array_shift($data);
387 $wholemessage = implode('', $data);
388 if (ereg('\\{([^\\}]*)\\}', $topline, $regs)) {
389 $ret = substr( $wholemessage, 0, $regs[1] );
391 There is some information in the content info header that could be important
392 in order to parse html messages. Let's get them here.
394 if ( $ret{0} == '<' ) {
395 $data = sqimap_run_command ($imap_stream, "FETCH $id BODY[$ent_id.MIME]", true, $response, $message);
398 foreach( $data as $d ) {
399 if ( substr( $d, 0, 13 ) == 'Content-Base:' ) {
404 ( !isNoSep( $d{$i} ) ||
$d{$i} == '"' ) )
407 if ( isNoSep( $d{$i} ) )
412 } elseif ( $k == 1 && !isnosep( $d{0} ) ) {
413 $base .= substr( $d, 1 );
419 $ret = "<base href=\"$base\">" . $ret;
421 } else if (ereg('"([^"]*)"', $topline, $regs)) {
424 global $where, $what, $mailbox, $passed_id, $startMessage;
425 $par = "mailbox=".urlencode($mailbox)."&passed_id=$passed_id";
426 if (isset($where) && isset($what)) {
427 $par .= "&where=".urlencode($where)."&what=".urlencode($what);
429 $par .= "&startMessage=$startMessage&show_more=0";
431 $par .= '&response='.urlencode($response).'&message='.urlencode($message).
432 '&topline='.urlencode($topline);
434 echo '<b><font color=$color[2]>' .
435 _("Body retrieval error. The reason for this is most probably that the message is malformed. Please help us making future versions better by submitting this message to the developers knowledgebase!") .
436 "<A HREF=\"../src/retrievalerror.php?$par\">Submit message</A><BR>" .
437 '<tt>' . _("Response:") . "$response<BR>" .
438 _("Message:") . " $message<BR>" .
439 _("FETCH line:") . " $topline ....<BR></tt></font></b>";
442 $data = sqimap_run_command ($imap_stream, "FETCH $passed_id BODY[]", true, $response, $message);
444 $wholemessage = implode('', $data);
446 $ret = "---------------\n$wholemessage";
452 function mime_print_body_lines ($imap_stream, $id, $ent_id, $encoding) {
453 // do a bit of error correction. If we couldn't find the entity id, just guess
454 // that it is the first one. That is usually the case anyway.
458 $sid = sqimap_session_id();
459 // Don't kill the connection if the browser is over a dialup
460 // and it would take over 30 seconds to download it.
462 // don´t call set_time_limit in safe mode.
463 if (!ini_get("safe_mode")) {
467 fputs ($imap_stream, "$sid FETCH $id BODY[$ent_id]\r\n");
470 $read = fgets ($imap_stream,4096);
471 // This could be bad -- if the section has sqimap_session_id() . ' OK'
472 // or similar, it will kill the download.
473 while (!ereg("^".$sid." (OK|BAD|NO)(.*)$", $read, $regs)) {
474 if (trim($read) == ')==') {
476 $read = fgets ($imap_stream,4096);
477 if (ereg("^".$sid." (OK|BAD|NO)(.*)$", $read, $regs)) {
480 echo decodeBody($read1, $encoding) .
481 decodeBody($read, $encoding);
484 echo decodeBody($read, $encoding);
486 $read = fgets ($imap_stream,4096);
491 /* -[ END MIME DECODING ]----------------------------------------------------------- */
495 /* This is the first function called. It decides if this is a multipart
496 message or if it should be handled as a single entity
498 function decodeMime ($imap_stream, &$header) {
499 global $username, $key, $imapServerAddress, $imapPort;
500 return mime_structure ($imap_stream, $header);
503 // This is here for debugging purposes. It will print out a list
504 // of all the entity IDs that are in the $message object.
506 function listEntities ($message) {
508 if ($message->header->entity_id)
509 echo "<tt>" . $message->header->entity_id . ' : ' . $message->header->type0 . '/' . $message->header->type1 . '<br>';
510 for ($i = 0; $message->entities[$i]; $i++) {
511 $msg = listEntities($message->entities[$i], $ent_id);
519 /* returns a $message object for a particular entity id */
520 function getEntity ($message, $ent_id) {
522 if ($message->header
->entity_id
== $ent_id && strlen($ent_id) == strlen($message->header
->entity_id
)) {
525 for ($i = 0; isset($message->entities
[$i]); $i++
) {
526 $msg = getEntity ($message->entities
[$i], $ent_id);
536 * figures out what entity to display and returns the $message object
539 function findDisplayEntity ($message, $textOnly = 1) {
540 global $show_html_default;
545 if ( $message->header
->type0
== 'multipart' &&
546 ( $message->header
->type1
== 'alternative' ||
547 $message->header
->type1
== 'related' ) &&
548 $show_html_default && ! $textOnly ) {
549 $entity = findDisplayEntityHTML($message);
552 // Show text/plain or text/html -- the first one we find.
554 $message->header
->type0
== 'text' &&
555 ( $message->header
->type1
== 'plain' ||
556 $message->header
->type1
== 'html' ) &&
557 isset($message->header
->entity_id
) ) {
558 $entity = $message->header
->entity_id
;
562 while ($entity == 0 && isset($message->entities
[$i]) ) {
563 $entity = findDisplayEntity($message->entities
[$i], $textOnly);
571 /* Shows the HTML version */
572 function findDisplayEntityHTML ($message) {
574 if ( $message->header
->type0
== 'text' &&
575 $message->header
->type1
== 'html' &&
576 isset($message->header
->entity_id
)) {
577 return $message->header
->entity_id
;
579 for ($i = 0; isset($message->entities
[$i]); $i ++
) {
580 $entity = findDisplayEntityHTML($message->entities
[$i]);
589 /* This returns a parsed string called $body. That string can then
590 be displayed as the actual message in the HTML. It contains
591 everything needed, including HTML Tags, Attachments at the
594 function formatBody($imap_stream, $message, $color, $wrap_at) {
595 // this if statement checks for the entity to show as the
596 // primary message. To add more of them, just put them in the
597 // order that is their priority.
598 global $startMessage, $username, $key, $imapServerAddress, $imapPort,
601 $id = $message->header
->id
;
602 $urlmailbox = urlencode($message->header
->mailbox
);
604 // Get the right entity and redefine message to be this entity
605 // Pass the 0 to mean that we want the 'best' viewable one
606 $ent_num = findDisplayEntity ($message, 0);
607 $body_message = getEntity($message, $ent_num);
608 if (($body_message->header
->type0
== 'text') ||
609 ($body_message->header
->type0
== 'rfc822')) {
611 $body = mime_fetch_body ($imap_stream, $id, $ent_num);
612 $body = decodeBody($body, $body_message->header
->encoding
);
613 $hookResults = do_hook("message_body", $body);
614 $body = $hookResults[1];
616 // If there are other types that shouldn't be formatted, add
618 if ($body_message->header
->type1
== 'html') {
619 if ( $show_html_default <> 1 ) {
620 $body = strip_tags( $body );
621 translateText($body, $wrap_at, $body_message->header
->charset
);
623 $body = MagicHTML( $body, $id );
626 translateText($body, $wrap_at, $body_message->header
->charset
);
629 $body .= "<SMALL><CENTER><A HREF=\"../src/download.php?absolute_dl=true&passed_id=$id&passed_ent_id=$ent_num&mailbox=$urlmailbox&showHeaders=1\">". _("Download this as a file") ."</A></CENTER><BR></SMALL>";
631 /** Display the ATTACHMENTS: message if there's more than one part **/
632 $body .= "</TD></TR></TABLE>";
633 if (isset($message->entities
[0])) {
634 $body .= formatAttachments ($message, $ent_num, $message->header
->mailbox
, $id);
636 $body .= "</TD></TR></TABLE>";
638 $body = formatAttachments ($message, -1, $message->header
->mailbox
, $id);
644 * A recursive function that returns a list of attachments with links
645 * to where to download these attachments
647 function formatAttachments ($message, $ent_id, $mailbox, $id) {
648 global $where, $what;
649 global $startMessage, $color;
650 static $ShownHTML = 0;
653 if ($ShownHTML == 0) {
656 $body .= "<TABLE WIDTH=\"100%\" CELLSPACING=0 CELLPADDING=2 BORDER=0 BGCOLOR=\"$color[0]\"><TR>\n" .
657 "<TH ALIGN=\"left\" BGCOLOR=\"$color[9]\"><B>\n" .
658 _("Attachments") . ':' .
659 "</B></TH></TR><TR><TD>\n" .
660 "<TABLE CELLSPACING=0 CELLPADDING=1 BORDER=0>\n" .
661 formatAttachments ($message, $ent_id, $mailbox, $id) .
662 "</TABLE></TD></TR></TABLE>";
668 if (!$message->entities
) {
669 $type0 = strtolower($message->header
->type0
);
670 $type1 = strtolower($message->header
->type1
);
671 $name = decodeHeader($message->header
->name
);
673 if ($message->header
->entity_id
!= $ent_id) {
674 $filename = decodeHeader($message->header
->filename
);
675 if (trim($filename) == '') {
676 if (trim($name) == '') {
677 if ( trim( $message->header
->id
) == '' )
678 $display_filename = 'untitled-[' . $message->header
->entity_id
. ']' ;
680 $display_filename = 'cid: ' . $message->header
->id
;
681 // $display_filename = 'untitled-[' . $message->header->entity_id . ']' ;
683 $display_filename = $name;
687 $display_filename = $filename;
690 $urlMailbox = urlencode($mailbox);
691 $ent = urlencode($message->header
->entity_id
);
694 "../src/download.php?startMessage=$startMessage&passed_id=$id&mailbox=$urlMailbox&passed_ent_id=$ent";
696 $DefaultLink .= '&where=' . urlencode($where) . '&what=' . urlencode($what);
697 $Links['download link']['text'] = _("download");
698 $Links['download link']['href'] =
699 "../src/download.php?absolute_dl=true&passed_id=$id&mailbox=$urlMailbox&passed_ent_id=$ent";
702 /* this executes the attachment hook with a specific MIME-type.
703 * if that doens't have results, it tries if there's a rule
704 * for a more generic type. */
705 $HookResults = do_hook("attachment $type0/$type1", $Links,
706 $startMessage, $id, $urlMailbox, $ent, $DefaultLink,
707 $display_filename, $where, $what);
708 if(count($HookResults[1]) <= 1) {
709 $HookResults = do_hook("attachment $type0/*", $Links,
710 $startMessage, $id, $urlMailbox, $ent, $DefaultLink,
711 $display_filename, $where, $what);
714 $Links = $HookResults[1];
715 $DefaultLink = $HookResults[6];
717 $body .= '<TR><TD> </TD><TD>' .
718 "<A HREF=\"$DefaultLink\">$display_filename</A> </TD>" .
719 '<TD><SMALL><b>' . show_readable_size($message->header
->size
) .
720 '</b> </small></TD>' .
721 "<TD><SMALL>[ $type0/$type1 ] </SMALL></TD>" .
723 if ($message->header
->description
)
724 $body .= '<b>' . htmlspecialchars($message->header
->description
) . '</b>';
725 $body .= '</SMALL></TD><TD><SMALL> ';
729 foreach ($Links as $Val) {
733 $body .= ' | ';
735 $body .= '<a href="' . $Val['href'] . '">' . $Val['text'] . '</a>';
740 $body .= "</SMALL></TD></TR>\n";
743 for ($i = 0; $i < count($message->entities
); $i++
) {
744 $body .= formatAttachments ($message->entities
[$i], $ent_id, $mailbox, $id);
752 /** this function decodes the body depending on the encoding type. **/
753 function decodeBody($body, $encoding) {
754 $body = str_replace("\r\n", "\n", $body);
755 $encoding = strtolower($encoding);
757 global $show_html_default;
759 if ($encoding == 'quoted-printable') {
760 $body = quoted_printable_decode($body);
763 while (ereg("=\n", $body))
764 $body = ereg_replace ("=\n", "", $body);
766 } else if ($encoding == 'base64') {
767 $body = base64_decode($body);
770 // All other encodings are returned raw.
775 * This function decodes strings that are encoded according to
776 * RFC1522 (MIME Part Two: Message Header Extensions for Non-ASCII Text).
778 function decodeHeader ($string, $utfencode=true) {
780 if ( is_array( $string ) ) {
781 $string = implode("\n", $string );
784 if (eregi('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=',
786 if (ucfirst($res[2]) == 'B') {
787 $replace = base64_decode($res[3]);
789 $replace = str_replace('_', ' ', $res[3]);
790 // Convert lowercase Quoted Printable to uppercase for
791 // quoted_printable_decode to understand it.
792 while (ereg("(=(([0-9][abcdef])|([abcdef][0-9])|([abcdef][abcdef])))",
794 $replace = str_replace($res[1], strtoupper($res[1]), $replace);
796 $replace = quoted_printable_decode($replace);
798 /* Only encode into entities by default. Some places
799 don't need the encoding, like the compose form. */
801 $replace = charset_decode ($res[1], $replace);
804 // Remove the name of the character set.
805 $string = eregi_replace ('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=',
808 // In case there should be more encoding in the string: recurse
809 $string = decodeHeader($string);
816 * Encode a string according to RFC 1522 for use in headers if it
817 * contains 8-bit characters or anything that looks like it should
820 function encodeHeader ($string) {
821 global $default_charset;
823 // Encode only if the string contains 8-bit characters or =?
824 $j = strlen( $string );
825 $l = strstr($string, '=?'); // Must be encoded ?
827 for( $i=0; $i < $j; ++
$i) {
828 switch( $string{$i} ) {
842 $k = ord( $string{$i} );
844 $ret .= sprintf("=%02X", $k);
852 $string = "=?$default_charset?Q?$ret?=";
859 Strips dangerous tags from html messages.
861 function MagicHTML( $body, $id ) {
863 global $message, $HTTP_SERVER_VARS,
864 $attachment_common_show_images;
866 $attachment_common_show_images =
867 FALSE; // Don't display attached images in HTML mode
868 $j = strlen( $body ); // Legnth of the HTML
869 $ret = ''; // Returned string
870 $bgcolor = '#ffffff'; // Background style color (defaults to white)
871 $textcolor = '#000000'; // Foreground style color (defaults to black)
872 $leftmargin = ''; // Left margin style
873 $title = ''; // HTML title if any
877 if ( $body{$i} == '<' ) {
880 while ($body{$pos} == ' ' ||
$body{$pos} == "\t" ||
881 $body{$pos} == "\n") {
884 while (strlen($tag) < 4 && $body{$pos} != ' ' &&
885 $body{$pos} != "\t" && $body{$pos} != "\n") {
889 switch( strtoupper( $tag ) ) {
890 // Strips the entire tag and contents
897 while ( $body{$i+
1}.$body{$i+
2}.$body{$i+
3}.$body{$i+
4}.$body{$i+
5} <> $etg &&
899 while ( $i < $j && $body{++
$i} <> '>' );
900 // $ret .= "<!-- $tag removed -->";
905 while ( $body{$i} <> '>' && // </title>
910 while ( $body{$i} <> '<' && // </title>
917 // Destroy these tags
928 while ( $body{$i} <> '>' &&
935 while ( $body{$i} <> '>' && // </title>
939 // We parse the style to look for interesting stuff
941 while ( $body{$i} <> '>' &&
943 // First we get the name of the style
945 while ( $body{$i} <> '>' &&
949 if ( isnoSep( $body{$i} ) )
953 stripComments( $i, $j, $body );
954 $style = strtoupper( trim( $style ) );
955 if ( $style == 'BODY' ) {
956 // Next we look into the definitions of the body style
957 while ( $body{$i} <> '>' &&
960 // We look for the background color if any.
961 if ( substr( $body, $i, 17 ) == 'BACKGROUND-COLOR:' ) {
963 $bgcolor = getStyleData( $i, $j, $body );
964 } elseif ( substr( $body, $i, 12 ) == 'MARGIN-LEFT:' ) {
966 $leftmargin = getStyleData( $i, $j, $body );
971 // Other style are mantained
972 $styleblk .= "$style ";
973 while ( $body{$i} <> '>' &&
977 $styleblk .= $body{$i};
980 $styleblk .= $body{$i};
982 stripComments( $i, $j, $body );
983 if ( $body{$i} <> '>' )
986 if ( $styleblk <> '' )
987 $ret .= "<style>$styleblk";
991 $ret .= '<b>' . _("Title:") . " </b>$title<br>\n";
994 if (! isset($base)) {
997 $ret .= stripEvent( $i, $j, $body, $id, $base );
998 $ret .= " bgcolor=$bgcolor width=\"100%\"><tr>";
999 if ( $leftmargin <> '' )
1000 $ret .= "<td width=$leftmargin> </td>";
1002 if (strtolower($bgcolor) == 'ffffff' ||
1003 strtolower($bgcolor) == '#ffffff')
1004 $ret .= '<font color=#000000>';
1009 while ( !isNoSep( $body{$i} ) &&
1013 if ( strcasecmp( substr( $base, 0, 4 ), 'href' ) ) {
1015 while ( !isNoSep( $body{$i} ) &&
1019 while ( $body{$i} <> '>' &&
1021 if ( $body{$i} <> '"' ) {
1026 // Debuging $ret .= "<!-- base == $base -->";
1027 if ( strcasecmp( substr( $base, 0, 4 ), 'file' ) <> 0 ) {
1028 $ret .= "\n<BASE HREF=\"$base\">\n";
1033 $ret .= '</font></td></tr></TABLE>';
1037 // Following tags can contain some event handler, lets search it
1038 stripComments( $i, $j, $body );
1039 if (! isset($base)) {
1042 $ret .= stripEvent( $i, $j, $body, $id, $base ) . '>';
1043 // $ret .= "<!-- $tag detected -->";
1051 return( "\n\n<!-- HTML Output ahead -->\n" .
1053 "\n<!-- END of HTML Output --><base href=\"".
1054 get_location() . '/'.
1058 function isNoSep( $char ) {
1076 The following function is useful for removing extra data that can cause
1077 html not to display properly, especially with MS stuff.
1080 function stripComments( &$i, $j, &$body ) {
1082 while ( $body{$i}.$body{$i+
1}.$body{$i+
2}.$body{$i+
3} == '<!--' &&
1085 while ( $body{$i-2}.$body{$i-1}.$body{$i} <> '-->' &&
1095 /* Gets the style data of a specific style */
1097 function getStyleData( &$i, $j, &$body ) {
1100 while ( $body{$i} <> '>' && !isNoSep( $body{$i} ) &&
1104 // And get the color
1106 while ( isNoSep( $body{$i} ) &&
1116 Private function for strip_dangerous_tag. Looks for event-based code and "removes" it
1117 by changing "on" to "no" (onload -> noload)
1120 function stripEvent( &$i, $j, &$body, $id, $base ) {
1122 global $message, $base_uri;
1126 while ( $body{$i} <> '>' &&
1128 $etg = strtolower($body{$i}.$body{$i+
1}.$body{$i+
2});
1131 // This is probably a src specification
1133 while( !isNoSep( $body{$k} )) {
1136 if ( $body{$k} == '=' ) {
1139 while( !isNoSep( $body{$k} ) &&
1144 while ( $body{$k} <> '>' && isNoSep( $body{$k} ) &&
1149 while( !isNoSep( $body{$k} ) &&
1153 if ( strtolower( substr( $src, 0, 4 ) ) == 'cid:' ) {
1154 $src = substr( $src, 4 );
1155 $src = "../src/download.php?absolute_dl=true&passed_id=$id&mailbox=" .
1156 urlencode( $message->header
->mailbox
) .
1157 "&passed_ent_id=" . find_ent_id( $src, $message );
1158 } else if ( strtolower( substr( $src, 0, 4 ) ) <> 'http' ||
1159 stristr( $src, $base_uri ) ) {
1160 /* Javascript and local urls goes out */
1161 $src = '../images/' . _("sec_remove_eng.png");
1163 $ret .= 'src="' . $src . '" ';
1172 // Retrolinks are not allowed without a base because they mess with SM security
1173 if ( $base == '' ) {
1182 if ( $body{$i+
3} == ':') {
1185 while ( isNoSep( $body{$i} ) &&
1187 $name .= $body{$i++
};
1189 if ( $name <> '' ) {
1190 $ret .= "../src/download.php?absolute_dl=true&passed_id=$id&mailbox=" .
1191 urlencode( $message->header
->mailbox
) .
1192 "&passed_ent_id=" . find_ent_id( $name, $message );
1193 if ( $body{$k} == '"' )
1198 if ( $body{$i} == '>' )
1210 if ( strcasecmp( $body{$i-4}.$body{$i-3}.$body{$i-2}.$body{$i-1}.$body{$i}.$body{$i+
1}.$body{$i+
2}, 'script:') == 0 ) {
1226 /* This function tries to locate the entity_id of a specific mime element */
1228 function find_ent_id( $id, $message ) {
1231 for ($i=0; $ret == '' && $i < count($message->entities
); $i++
) {
1233 if ( $message->entities
[$i]->header
->entity_id
== '' ) {
1234 $ret = find_ent_id( $id, $message->entities
[$i] );
1236 if ( strcasecmp( $message->entities
[$i]->header
->id
, $id ) == 0 )
1237 $ret = $message->entities
[$i]->header
->entity_id
;