d0fc0c25e8ec94966708e6afd295e112639ffd89
[exim.git] / src / src / receive.c
1 /*************************************************
2 * Exim - an Internet mail transport agent *
3 *************************************************/
4
5 /* Copyright (c) University of Cambridge 1995 - 2012 */
6 /* See the file NOTICE for conditions of use and distribution. */
7
8 /* Code for receiving a message and setting up spool files. */
9
10 #include "exim.h"
11
12 #ifdef EXPERIMENTAL_DCC
13 extern int dcc_ok;
14 #endif
15
16 /*************************************************
17 * Local static variables *
18 *************************************************/
19
20 static FILE *data_file = NULL;
21 static int data_fd = -1;
22 static uschar spool_name[256];
23
24
25
26 /*************************************************
27 * Non-SMTP character reading functions *
28 *************************************************/
29
30 /* These are the default functions that are set up in the variables such as
31 receive_getc initially. They just call the standard functions, passing stdin as
32 the file. (When SMTP input is occurring, different functions are used by
33 changing the pointer variables.) */
34
35 int
36 stdin_getc(void)
37 {
38 return getc(stdin);
39 }
40
41 int
42 stdin_ungetc(int c)
43 {
44 return ungetc(c, stdin);
45 }
46
47 int
48 stdin_feof(void)
49 {
50 return feof(stdin);
51 }
52
53 int
54 stdin_ferror(void)
55 {
56 return ferror(stdin);
57 }
58
59
60
61
62 /*************************************************
63 * Check that a set sender is allowed *
64 *************************************************/
65
66 /* This function is called when a local caller sets an explicit sender address.
67 It checks whether this is permitted, which it is for trusted callers.
68 Otherwise, it must match the pattern(s) in untrusted_set_sender.
69
70 Arguments: the proposed sender address
71 Returns: TRUE for a trusted caller
72 TRUE if the address has been set, untrusted_set_sender has been
73 set, and the address matches something in the list
74 FALSE otherwise
75 */
76
77 BOOL
78 receive_check_set_sender(uschar *newsender)
79 {
80 uschar *qnewsender;
81 if (trusted_caller) return TRUE;
82 if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
83 qnewsender = (Ustrchr(newsender, '@') != NULL)?
84 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
85 return
86 match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1,
87 0, NULL) == OK;
88 }
89
90
91
92
93 /*************************************************
94 * Read space info for a partition *
95 *************************************************/
96
97 /* This function is called by receive_check_fs() below, and also by string
98 expansion for variables such as $spool_space. The field names for the statvfs
99 structure are macros, because not all OS have F_FAVAIL and it seems tidier to
100 have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
101 have inodes, and they return -1 for the number available.
102
103 Later: It turns out that some file systems that do not have the concept of
104 inodes return 0 rather than -1. Such systems should also return 0 for the total
105 number of inodes, so we require that to be greater than zero before returning
106 an inode count.
107
108 Arguments:
109 isspool TRUE for spool partition, FALSE for log partition
110 inodeptr address of int to receive inode count; -1 if there isn't one
111
112 Returns: available on-root space, in kilobytes
113 -1 for log partition if there isn't one
114
115 All values are -1 if the STATFS functions are not available.
116 */
117
118 int
119 receive_statvfs(BOOL isspool, int *inodeptr)
120 {
121 #ifdef HAVE_STATFS
122 struct STATVFS statbuf;
123 uschar *path;
124 uschar *name;
125 uschar buffer[1024];
126
127 /* The spool directory must always exist. */
128
129 if (isspool)
130 {
131 path = spool_directory;
132 name = US"spool";
133 }
134
135 /* Need to cut down the log file path to the directory, and to ignore any
136 appearance of "syslog" in it. */
137
138 else
139 {
140 int sep = ':'; /* Not variable - outside scripts use */
141 uschar *p = log_file_path;
142 name = US"log";
143
144 /* An empty log_file_path means "use the default". This is the same as an
145 empty item in a list. */
146
147 if (*p == 0) p = US":";
148 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL)
149 {
150 if (Ustrcmp(path, "syslog") != 0) break;
151 }
152
153 if (path == NULL) /* No log files */
154 {
155 *inodeptr = -1;
156 return -1;
157 }
158
159 /* An empty string means use the default, which is in the spool directory.
160 But don't just use the spool directory, as it is possible that the log
161 subdirectory has been symbolically linked elsewhere. */
162
163 if (path[0] == 0)
164 {
165 sprintf(CS buffer, CS"%s/log", CS spool_directory);
166 path = buffer;
167 }
168 else
169 {
170 uschar *cp;
171 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
172 }
173 }
174
175 /* We now have the path; do the business */
176
177 memset(&statbuf, 0, sizeof(statbuf));
178
179 if (STATVFS(CS path, &statbuf) != 0)
180 {
181 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
182 "%s directory %s: %s", name, spool_directory, strerror(errno));
183 smtp_closedown(US"spool or log directory problem");
184 exim_exit(EXIT_FAILURE);
185 }
186
187 *inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
188
189 /* Disks are getting huge. Take care with computing the size in kilobytes. */
190
191 return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
192
193 /* Unable to find partition sizes in this environment. */
194
195 #else
196 *inodeptr = -1;
197 return -1;
198 #endif
199 }
200
201
202
203
204 /*************************************************
205 * Check space on spool and log partitions *
206 *************************************************/
207
208 /* This function is called before accepting a message; if any thresholds are
209 set, it checks them. If a message_size is supplied, it checks that there is
210 enough space for that size plus the threshold - i.e. that the message won't
211 reduce the space to the threshold. Not all OS have statvfs(); for those that
212 don't, this function always returns TRUE. For some OS the old function and
213 struct name statfs is used; that is handled by a macro, defined in exim.h.
214
215 Arguments:
216 msg_size the (estimated) size of an incoming message
217
218 Returns: FALSE if there isn't enough space, or if the information cannot
219 be obtained
220 TRUE if no check was done or there is enough space
221 */
222
223 BOOL
224 receive_check_fs(int msg_size)
225 {
226 int space, inodes;
227
228 if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
229 {
230 space = receive_statvfs(TRUE, &inodes);
231
232 DEBUG(D_receive)
233 debug_printf("spool directory space = %dK inodes = %d "
234 "check_space = %dK inodes = %d msg_size = %d\n",
235 space, inodes, check_spool_space, check_spool_inodes, msg_size);
236
237 if ((space >= 0 && space < check_spool_space) ||
238 (inodes >= 0 && inodes < check_spool_inodes))
239 {
240 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
241 "inodes=%d", space, inodes);
242 return FALSE;
243 }
244 }
245
246 if (check_log_space > 0 || check_log_inodes > 0)
247 {
248 space = receive_statvfs(FALSE, &inodes);
249
250 DEBUG(D_receive)
251 debug_printf("log directory space = %dK inodes = %d "
252 "check_space = %dK inodes = %d\n",
253 space, inodes, check_log_space, check_log_inodes);
254
255 if ((space >= 0 && space < check_log_space) ||
256 (inodes >= 0 && inodes < check_log_inodes))
257 {
258 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
259 "inodes=%d", space, inodes);
260 return FALSE;
261 }
262 }
263
264 return TRUE;
265 }
266
267
268
269 /*************************************************
270 * Bomb out while reading a message *
271 *************************************************/
272
273 /* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
274 received, or if there is a timeout. A rarer case might be if the log files are
275 screwed up and Exim can't open them to record a message's arrival. Handling
276 that case is done by setting a flag to cause the log functions to call this
277 function if there is an ultimate disaster. That is why it is globally
278 accessible.
279
280 Arguments:
281 reason text reason to pass to the not-quit ACL
282 msg default SMTP response to give if in an SMTP session
283 Returns: it doesn't
284 */
285
286 void
287 receive_bomb_out(uschar *reason, uschar *msg)
288 {
289 /* If spool_name is set, it contains the name of the data file that is being
290 written. Unlink it before closing so that it cannot be picked up by a delivery
291 process. Ensure that any header file is also removed. */
292
293 if (spool_name[0] != 0)
294 {
295 Uunlink(spool_name);
296 spool_name[Ustrlen(spool_name) - 1] = 'H';
297 Uunlink(spool_name);
298 }
299
300 /* Now close the file if it is open, either as a fd or a stream. */
301
302 if (data_file != NULL) (void)fclose(data_file);
303 else if (data_fd >= 0) (void)close(data_fd);
304
305 /* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
306 smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
307 SMTP response. */
308
309 if (smtp_input)
310 {
311 if (smtp_batched_input)
312 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
313 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
314 smtp_active_hostname, msg);
315 }
316
317 /* Exit from the program (non-BSMTP cases) */
318
319 exim_exit(EXIT_FAILURE);
320 }
321
322
323 /*************************************************
324 * Data read timeout *
325 *************************************************/
326
327 /* Handler function for timeouts that occur while reading the data that
328 comprises a message.
329
330 Argument: the signal number
331 Returns: nothing
332 */
333
334 static void
335 data_timeout_handler(int sig)
336 {
337 uschar *msg = NULL;
338
339 sig = sig; /* Keep picky compilers happy */
340
341 if (smtp_input)
342 {
343 msg = US"SMTP incoming data timeout";
344 log_write(L_lost_incoming_connection,
345 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
346 "from %s F=<%s>",
347 (sender_fullhost != NULL)? sender_fullhost : US"local process",
348 sender_address);
349 }
350 else
351 {
352 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
353 log_write(L_lost_incoming_connection,
354 LOG_MAIN, "timed out while reading local message");
355 }
356
357 receive_bomb_out(US"data-timeout", msg); /* Does not return */
358 }
359
360
361
362 /*************************************************
363 * local_scan() timeout *
364 *************************************************/
365
366 /* Handler function for timeouts that occur while running a local_scan()
367 function.
368
369 Argument: the signal number
370 Returns: nothing
371 */
372
373 static void
374 local_scan_timeout_handler(int sig)
375 {
376 sig = sig; /* Keep picky compilers happy */
377 log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
378 "message temporarily rejected (size %d)", message_size);
379 /* Does not return */
380 receive_bomb_out(US"local-scan-timeout", US"local verification problem");
381 }
382
383
384
385 /*************************************************
386 * local_scan() crashed *
387 *************************************************/
388
389 /* Handler function for signals that occur while running a local_scan()
390 function.
391
392 Argument: the signal number
393 Returns: nothing
394 */
395
396 static void
397 local_scan_crash_handler(int sig)
398 {
399 log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
400 "signal %d - message temporarily rejected (size %d)", sig, message_size);
401 /* Does not return */
402 receive_bomb_out(US"local-scan-error", US"local verification problem");
403 }
404
405
406 /*************************************************
407 * SIGTERM or SIGINT received *
408 *************************************************/
409
410 /* Handler for SIGTERM or SIGINT signals that occur while reading the
411 data that comprises a message.
412
413 Argument: the signal number
414 Returns: nothing
415 */
416
417 static void
418 data_sigterm_sigint_handler(int sig)
419 {
420 uschar *msg = NULL;
421
422 if (smtp_input)
423 {
424 msg = US"Service not available - SIGTERM or SIGINT received";
425 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
426 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
427 }
428 else
429 {
430 if (filter_test == FTEST_NONE)
431 {
432 fprintf(stderr, "\nexim: %s received - message abandoned\n",
433 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
434 log_write(0, LOG_MAIN, "%s received while reading local message",
435 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
436 }
437 }
438
439 receive_bomb_out(US"signal-exit", msg); /* Does not return */
440 }
441
442
443
444 /*************************************************
445 * Add new recipient to list *
446 *************************************************/
447
448 /* This function builds a list of recipient addresses in argc/argv
449 format.
450
451 Arguments:
452 recipient the next address to add to recipients_list
453 pno parent number for fixed aliases; -1 otherwise
454
455 Returns: nothing
456 */
457
458 void
459 receive_add_recipient(uschar *recipient, int pno)
460 {
461 if (recipients_count >= recipients_list_max)
462 {
463 recipient_item *oldlist = recipients_list;
464 int oldmax = recipients_list_max;
465 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
466 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
467 if (oldlist != NULL)
468 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
469 }
470
471 recipients_list[recipients_count].address = recipient;
472 recipients_list[recipients_count].pno = pno;
473 #ifdef EXPERIMENTAL_BRIGHTMAIL
474 recipients_list[recipients_count].bmi_optin = bmi_current_optin;
475 /* reset optin string pointer for next recipient */
476 bmi_current_optin = NULL;
477 #endif
478 recipients_list[recipients_count++].errors_to = NULL;
479 }
480
481
482
483
484 /*************************************************
485 * Remove a recipient from the list *
486 *************************************************/
487
488 /* This function is provided for local_scan() to use.
489
490 Argument:
491 recipient address to remove
492
493 Returns: TRUE if it did remove something; FALSE otherwise
494 */
495
496 BOOL
497 receive_remove_recipient(uschar *recipient)
498 {
499 int count;
500 DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
501 recipient);
502 for (count = 0; count < recipients_count; count++)
503 {
504 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
505 {
506 if ((--recipients_count - count) > 0)
507 memmove(recipients_list + count, recipients_list + count + 1,
508 (recipients_count - count)*sizeof(recipient_item));
509 return TRUE;
510 }
511 }
512 return FALSE;
513 }
514
515
516
517
518
519 /*************************************************
520 * Read data portion of a non-SMTP message *
521 *************************************************/
522
523 /* This function is called to read the remainder of a message (following the
524 header) when the input is not from SMTP - we are receiving a local message on
525 a standard input stream. The message is always terminated by EOF, and is also
526 terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
527 two cases for maximum efficiency.
528
529 Ensure that the body ends with a newline. This will naturally be the case when
530 the termination is "\n.\n" but may not be otherwise. The RFC defines messages
531 as "sequences of lines" - this of course strictly applies only to SMTP, but
532 deliveries into BSD-type mailbox files also require it. Exim used to have a
533 flag for doing this at delivery time, but as it was always set for all
534 transports, I decided to simplify things by putting the check here instead.
535
536 There is at least one MUA (dtmail) that sends CRLF via this interface, and
537 other programs are known to do this as well. Exim used to have a option for
538 dealing with this: in July 2003, after much discussion, the code has been
539 changed to default to treat any of LF, CRLF, and bare CR as line terminators.
540
541 However, for the case when a dot on a line by itself terminates a message, the
542 only recognized terminating sequences before and after the dot are LF and CRLF.
543 Otherwise, having read EOL . CR, you don't know whether to read another
544 character or not.
545
546 Internally, in messages stored in Exim's spool files, LF is used as the line
547 terminator. Under the new regime, bare CRs will no longer appear in these
548 files.
549
550 Arguments:
551 fout a FILE to which to write the message
552
553 Returns: One of the END_xxx values indicating why it stopped reading
554 */
555
556 static int
557 read_message_data(FILE *fout)
558 {
559 int ch_state;
560 register int ch;
561 register int linelength = 0;
562
563 /* Handle the case when only EOF terminates the message */
564
565 if (!dot_ends)
566 {
567 register int last_ch = '\n';
568
569 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
570 {
571 if (ch == 0) body_zerocount++;
572 if (last_ch == '\r' && ch != '\n')
573 {
574 if (linelength > max_received_linelength)
575 max_received_linelength = linelength;
576 linelength = 0;
577 if (fputc('\n', fout) == EOF) return END_WERROR;
578 message_size++;
579 body_linecount++;
580 }
581 if (ch == '\r') continue;
582
583 if (fputc(ch, fout) == EOF) return END_WERROR;
584 if (ch == '\n')
585 {
586 if (linelength > max_received_linelength)
587 max_received_linelength = linelength;
588 linelength = 0;
589 body_linecount++;
590 }
591 else linelength++;
592 if (++message_size > thismessage_size_limit) return END_SIZE;
593 }
594
595 if (last_ch != '\n')
596 {
597 if (linelength > max_received_linelength)
598 max_received_linelength = linelength;
599 if (fputc('\n', fout) == EOF) return END_WERROR;
600 message_size++;
601 body_linecount++;
602 }
603
604 return END_EOF;
605 }
606
607 /* Handle the case when a dot on a line on its own, or EOF, terminates. */
608
609 ch_state = 1;
610
611 while ((ch = (receive_getc)()) != EOF)
612 {
613 if (ch == 0) body_zerocount++;
614 switch (ch_state)
615 {
616 case 0: /* Normal state (previous char written) */
617 if (ch == '\n')
618 {
619 body_linecount++;
620 if (linelength > max_received_linelength)
621 max_received_linelength = linelength;
622 linelength = -1;
623 ch_state = 1;
624 }
625 else if (ch == '\r')
626 { ch_state = 2; continue; }
627 break;
628
629 case 1: /* After written "\n" */
630 if (ch == '.') { ch_state = 3; continue; }
631 if (ch != '\n') ch_state = 0; else linelength = -1;
632 break;
633
634 case 2:
635 body_linecount++; /* After unwritten "\r" */
636 if (linelength > max_received_linelength)
637 max_received_linelength = linelength;
638 if (ch == '\n')
639 {
640 ch_state = 1;
641 linelength = -1;
642 }
643 else
644 {
645 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
646 if (ch == '\r') continue;
647 ch_state = 0;
648 linelength = 0;
649 }
650 break;
651
652 case 3: /* After "\n." (\n written, dot not) */
653 if (ch == '\n') return END_DOT;
654 if (ch == '\r') { ch_state = 4; continue; }
655 message_size++;
656 linelength++;
657 if (fputc('.', fout) == EOF) return END_WERROR;
658 ch_state = 0;
659 break;
660
661 case 4: /* After "\n.\r" (\n written, rest not) */
662 if (ch == '\n') return END_DOT;
663 message_size += 2;
664 body_linecount++;
665 if (fputs(".\n", fout) == EOF) return END_WERROR;
666 if (ch == '\r') { ch_state = 2; continue; }
667 ch_state = 0;
668 break;
669 }
670
671 linelength++;
672 if (fputc(ch, fout) == EOF) return END_WERROR;
673 if (++message_size > thismessage_size_limit) return END_SIZE;
674 }
675
676 /* Get here if EOF read. Unless we have just written "\n", we need to ensure
677 the message ends with a newline, and we must also write any characters that
678 were saved up while testing for an ending dot. */
679
680 if (ch_state != 1)
681 {
682 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
683 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
684 message_size += Ustrlen(ends[ch_state]);
685 body_linecount++;
686 }
687
688 return END_EOF;
689 }
690
691
692
693
694 /*************************************************
695 * Read data portion of an SMTP message *
696 *************************************************/
697
698 /* This function is called to read the remainder of an SMTP message (after the
699 headers), or to skip over it when an error has occurred. In this case, the
700 output file is passed as NULL.
701
702 If any line begins with a dot, that character is skipped. The input should only
703 be successfully terminated by CR LF . CR LF unless it is local (non-network)
704 SMTP, in which case the CRs are optional, but...
705
706 FUDGE: It seems that sites on the net send out messages with just LF
707 terminators, despite the warnings in the RFCs, and other MTAs handle this. So
708 we make the CRs optional in all cases.
709
710 July 2003: Bare CRs cause trouble. We now treat them as line terminators as
711 well, so that there are no CRs in spooled messages. However, the message
712 terminating dot is not recognized between two bare CRs.
713
714 Arguments:
715 fout a FILE to which to write the message; NULL if skipping
716
717 Returns: One of the END_xxx values indicating why it stopped reading
718 */
719
720 static int
721 read_message_data_smtp(FILE *fout)
722 {
723 int ch_state = 0;
724 int ch;
725 register int linelength = 0;
726
727 while ((ch = (receive_getc)()) != EOF)
728 {
729 if (ch == 0) body_zerocount++;
730 switch (ch_state)
731 {
732 case 0: /* After LF or CRLF */
733 if (ch == '.')
734 {
735 ch_state = 3;
736 continue; /* Don't ever write . after LF */
737 }
738 ch_state = 1;
739
740 /* Else fall through to handle as normal uschar. */
741
742 case 1: /* Normal state */
743 if (ch == '\n')
744 {
745 ch_state = 0;
746 body_linecount++;
747 if (linelength > max_received_linelength)
748 max_received_linelength = linelength;
749 linelength = -1;
750 }
751 else if (ch == '\r')
752 {
753 ch_state = 2;
754 continue;
755 }
756 break;
757
758 case 2: /* After (unwritten) CR */
759 body_linecount++;
760 if (linelength > max_received_linelength)
761 max_received_linelength = linelength;
762 linelength = -1;
763 if (ch == '\n')
764 {
765 ch_state = 0;
766 }
767 else
768 {
769 message_size++;
770 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
771 (void) cutthrough_put_nl();
772 if (ch != '\r') ch_state = 1; else continue;
773 }
774 break;
775
776 case 3: /* After [CR] LF . */
777 if (ch == '\n')
778 return END_DOT;
779 if (ch == '\r')
780 {
781 ch_state = 4;
782 continue;
783 }
784 ch_state = 1; /* The dot itself is removed */
785 break;
786
787 case 4: /* After [CR] LF . CR */
788 if (ch == '\n') return END_DOT;
789 message_size++;
790 body_linecount++;
791 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
792 (void) cutthrough_put_nl();
793 if (ch == '\r')
794 {
795 ch_state = 2;
796 continue;
797 }
798 ch_state = 1;
799 break;
800 }
801
802 /* Add the character to the spool file, unless skipping; then loop for the
803 next. */
804
805 message_size++;
806 linelength++;
807 if (fout != NULL)
808 {
809 if (fputc(ch, fout) == EOF) return END_WERROR;
810 if (message_size > thismessage_size_limit) return END_SIZE;
811 }
812 if(ch == '\n')
813 (void) cutthrough_put_nl();
814 else
815 {
816 uschar c= ch;
817 (void) cutthrough_puts(&c, 1);
818 }
819 }
820
821 /* Fall through here if EOF encountered. This indicates some kind of error,
822 since a correct message is terminated by [CR] LF . [CR] LF. */
823
824 return END_EOF;
825 }
826
827
828
829
830 /*************************************************
831 * Swallow SMTP message *
832 *************************************************/
833
834 /* This function is called when there has been some kind of error while reading
835 an SMTP message, and the remaining data may need to be swallowed. It is global
836 because it is called from smtp_closedown() to shut down an incoming call
837 tidily.
838
839 Argument: a FILE from which to read the message
840 Returns: nothing
841 */
842
843 void
844 receive_swallow_smtp(void)
845 {
846 if (message_ended >= END_NOTENDED)
847 message_ended = read_message_data_smtp(NULL);
848 }
849
850
851
852 /*************************************************
853 * Handle lost SMTP connection *
854 *************************************************/
855
856 /* This function logs connection loss incidents and generates an appropriate
857 SMTP response.
858
859 Argument: additional data for the message
860 Returns: the SMTP response
861 */
862
863 static uschar *
864 handle_lost_connection(uschar *s)
865 {
866 log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
867 "%s lost while reading message data%s", smtp_get_connection_info(), s);
868 return US"421 Lost incoming connection";
869 }
870
871
872
873
874 /*************************************************
875 * Handle a non-smtp reception error *
876 *************************************************/
877
878 /* This function is called for various errors during the reception of non-SMTP
879 messages. It either sends a message to the sender of the problem message, or it
880 writes to the standard error stream.
881
882 Arguments:
883 errcode code for moan_to_sender(), identifying the error
884 text1 first message text, passed to moan_to_sender()
885 text2 second message text, used only for stderrr
886 error_rc code to pass to exim_exit if no problem
887 f FILE containing body of message (may be stdin)
888 hptr pointer to instore headers or NULL
889
890 Returns: calls exim_exit(), which does not return
891 */
892
893 static void
894 give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
895 FILE *f, header_line *hptr)
896 {
897 if (error_handling == ERRORS_SENDER)
898 {
899 error_block eblock;
900 eblock.next = NULL;
901 eblock.text1 = text1;
902 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
903 error_rc = EXIT_FAILURE;
904 }
905 else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
906 (void)fclose(f);
907 exim_exit(error_rc);
908 }
909
910
911
912 /*************************************************
913 * Add header lines set up by ACL *
914 *************************************************/
915
916 /* This function is called to add the header lines that were set up by
917 statements in an ACL to the list of headers in memory. It is done in two stages
918 like this, because when the ACL for RCPT is running, the other headers have not
919 yet been received. This function is called twice; once just before running the
920 DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
921 are visible to the DATA ACL.
922
923 Originally these header lines were added at the end. Now there is support for
924 three different places: top, bottom, and after the Received: header(s). There
925 will always be at least one Received: header, even if it is marked deleted, and
926 even if something else has been put in front of it.
927
928 Arguments:
929 acl_name text to identify which ACL
930
931 Returns: nothing
932 */
933
934 static void
935 add_acl_headers(uschar *acl_name)
936 {
937 header_line *h, *next;
938 header_line *last_received = NULL;
939
940 if (acl_added_headers == NULL) return;
941 DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
942
943 for (h = acl_added_headers; h != NULL; h = next)
944 {
945 next = h->next;
946
947 switch(h->type)
948 {
949 case htype_add_top:
950 h->next = header_list;
951 header_list = h;
952 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
953 break;
954
955 case htype_add_rec:
956 if (last_received == NULL)
957 {
958 last_received = header_list;
959 while (!header_testname(last_received, US"Received", 8, FALSE))
960 last_received = last_received->next;
961 while (last_received->next != NULL &&
962 header_testname(last_received->next, US"Received", 8, FALSE))
963 last_received = last_received->next;
964 }
965 h->next = last_received->next;
966 last_received->next = h;
967 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
968 break;
969
970 case htype_add_rfc:
971 /* add header before any header which is NOT Received: or Resent- */
972 last_received = header_list;
973 while ( (last_received->next != NULL) &&
974 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
975 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
976 last_received = last_received->next;
977 /* last_received now points to the last Received: or Resent-* header
978 in an uninterrupted chain of those header types (seen from the beginning
979 of all headers. Our current header must follow it. */
980 h->next = last_received->next;
981 last_received->next = h;
982 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
983 break;
984
985 default:
986 h->next = NULL;
987 header_last->next = h;
988 break;
989 }
990
991 if (h->next == NULL) header_last = h;
992
993 /* Check for one of the known header types (From:, To:, etc.) though in
994 practice most added headers are going to be "other". Lower case
995 identification letters are never stored with the header; they are used
996 for existence tests when messages are received. So discard any lower case
997 flag values. */
998
999 h->type = header_checkname(h, FALSE);
1000 if (h->type >= 'a') h->type = htype_other;
1001
1002 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1003 }
1004
1005 acl_added_headers = NULL;
1006 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1007 }
1008
1009
1010
1011 /*************************************************
1012 * Add host information for log line *
1013 *************************************************/
1014
1015 /* Called for acceptance and rejecting log lines. This adds information about
1016 the calling host to a string that is being built dynamically.
1017
1018 Arguments:
1019 s the dynamic string
1020 sizeptr points to the size variable
1021 ptrptr points to the pointer variable
1022
1023 Returns: the extended string
1024 */
1025
1026 static uschar *
1027 add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr)
1028 {
1029 if (sender_fullhost != NULL)
1030 {
1031 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
1032 if ((log_extra_selector & LX_incoming_interface) != 0 &&
1033 interface_address != NULL)
1034 {
1035 uschar *ss = string_sprintf(" I=[%s]:%d", interface_address,
1036 interface_port);
1037 s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss));
1038 }
1039 }
1040 if (sender_ident != NULL)
1041 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1042 if (received_protocol != NULL)
1043 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1044 return s;
1045 }
1046
1047
1048
1049 #ifdef WITH_CONTENT_SCAN
1050
1051 /*************************************************
1052 * Run the MIME ACL on a message *
1053 *************************************************/
1054
1055 /* This code is in a subroutine so that it can be used for both SMTP
1056 and non-SMTP messages. It is called with a non-NULL ACL pointer.
1057
1058 Arguments:
1059 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1060 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1061 smtp_reply_ptr Where SMTP reply is being built
1062 blackholed_by_ptr Where "blackholed by" message is being built
1063
1064 Returns: TRUE to carry on; FALSE to abandon the message
1065 */
1066
1067 static BOOL
1068 run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1069 uschar **blackholed_by_ptr)
1070 {
1071 FILE *mbox_file;
1072 uschar rfc822_file_path[2048];
1073 unsigned long mbox_size;
1074 header_line *my_headerlist;
1075 uschar *user_msg, *log_msg;
1076 int mime_part_count_buffer = -1;
1077 int rc = OK;
1078
1079 memset(CS rfc822_file_path,0,2048);
1080
1081 /* check if it is a MIME message */
1082 my_headerlist = header_list;
1083 while (my_headerlist != NULL)
1084 {
1085 /* skip deleted headers */
1086 if (my_headerlist->type == '*')
1087 {
1088 my_headerlist = my_headerlist->next;
1089 continue;
1090 }
1091 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1092 {
1093 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1094 goto DO_MIME_ACL;
1095 }
1096 my_headerlist = my_headerlist->next;
1097 }
1098
1099 DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1100 return TRUE;
1101
1102 DO_MIME_ACL:
1103 /* make sure the eml mbox file is spooled up */
1104 mbox_file = spool_mbox(&mbox_size, NULL);
1105 if (mbox_file == NULL) {
1106 /* error while spooling */
1107 log_write(0, LOG_MAIN|LOG_PANIC,
1108 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1109 Uunlink(spool_name);
1110 unspool_mbox();
1111 #ifdef EXPERIMENTAL_DCC
1112 dcc_ok = 0;
1113 #endif
1114 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
1115 message_id[0] = 0; /* Indicate no message accepted */
1116 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1117 return FALSE; /* Indicate skip to end of receive function */
1118 };
1119
1120 mime_is_rfc822 = 0;
1121
1122 MIME_ACL_CHECK:
1123 mime_part_count = -1;
1124 rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
1125 (void)fclose(mbox_file);
1126
1127 if (Ustrlen(rfc822_file_path) > 0)
1128 {
1129 mime_part_count = mime_part_count_buffer;
1130
1131 if (unlink(CS rfc822_file_path) == -1)
1132 {
1133 log_write(0, LOG_PANIC,
1134 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1135 goto END_MIME_ACL;
1136 }
1137 }
1138
1139 /* check if we must check any message/rfc822 attachments */
1140 if (rc == OK)
1141 {
1142 uschar temp_path[1024];
1143 int n;
1144 struct dirent *entry;
1145 DIR *tempdir;
1146
1147 (void)string_format(temp_path, 1024, "%s/scan/%s", spool_directory,
1148 message_id);
1149
1150 tempdir = opendir(CS temp_path);
1151 n = 0;
1152 do
1153 {
1154 entry = readdir(tempdir);
1155 if (entry == NULL) break;
1156 if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0)
1157 {
1158 (void)string_format(rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
1159 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path);
1160 break;
1161 }
1162 } while (1);
1163 closedir(tempdir);
1164
1165 if (entry != NULL)
1166 {
1167 mbox_file = Ufopen(rfc822_file_path,"rb");
1168 if (mbox_file == NULL)
1169 {
1170 log_write(0, LOG_PANIC,
1171 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1172 unlink(CS rfc822_file_path);
1173 goto END_MIME_ACL;
1174 }
1175 /* set RFC822 expansion variable */
1176 mime_is_rfc822 = 1;
1177 mime_part_count_buffer = mime_part_count;
1178 goto MIME_ACL_CHECK;
1179 }
1180 }
1181
1182 END_MIME_ACL:
1183 add_acl_headers(US"MIME");
1184 if (rc == DISCARD)
1185 {
1186 recipients_count = 0;
1187 *blackholed_by_ptr = US"MIME ACL";
1188 }
1189 else if (rc != OK)
1190 {
1191 Uunlink(spool_name);
1192 unspool_mbox();
1193 #ifdef EXPERIMENTAL_DCC
1194 dcc_ok = 0;
1195 #endif
1196 if (smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1197 *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */
1198 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1199 message_id[0] = 0; /* Indicate no message accepted */
1200 return FALSE; /* Cause skip to end of receive function */
1201 }
1202
1203 return TRUE;
1204 }
1205
1206 #endif /* WITH_CONTENT_SCAN */
1207
1208
1209
1210 void
1211 received_header_gen(void)
1212 {
1213 uschar *received;
1214 uschar *timestamp;
1215 header_line *received_header= header_list;
1216
1217 timestamp = expand_string(US"${tod_full}");
1218 if (recipients_count == 1) received_for = recipients_list[0].address;
1219 received = expand_string(received_header_text);
1220 received_for = NULL;
1221
1222 if (received == NULL)
1223 {
1224 if(spool_name[0] != 0)
1225 Uunlink(spool_name); /* Lose the data file */
1226 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1227 "(received_header_text) failed: %s", string_printing(received_header_text),
1228 expand_string_message);
1229 }
1230
1231 /* The first element on the header chain is reserved for the Received header,
1232 so all we have to do is fill in the text pointer, and set the type. However, if
1233 the result of the expansion is an empty string, we leave the header marked as
1234 "old" so as to refrain from adding a Received header. */
1235
1236 if (received[0] == 0)
1237 {
1238 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1239 received_header->type = htype_old;
1240 }
1241 else
1242 {
1243 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1244 received_header->type = htype_received;
1245 }
1246
1247 received_header->slen = Ustrlen(received_header->text);
1248
1249 DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1250 received_header->type, received_header->text);
1251 }
1252
1253
1254
1255 /*************************************************
1256 * Receive message *
1257 *************************************************/
1258
1259 /* Receive a message on the given input, and put it into a pair of spool files.
1260 Either a non-null list of recipients, or the extract flag will be true, or
1261 both. The flag sender_local is true for locally generated messages. The flag
1262 submission_mode is true if an ACL has obeyed "control = submission". The flag
1263 suppress_local_fixups is true if an ACL has obeyed "control =
1264 suppress_local_fixups" or -G was passed on the command-line.
1265 The flag smtp_input is true if the message is to be
1266 handled using SMTP conventions about termination and lines starting with dots.
1267 For non-SMTP messages, dot_ends is true for dot-terminated messages.
1268
1269 If a message was successfully read, message_id[0] will be non-zero.
1270
1271 The general actions of this function are:
1272
1273 . Read the headers of the message (if any) into a chain of store
1274 blocks.
1275
1276 . If there is a "sender:" header and the message is locally originated,
1277 throw it away, unless the caller is trusted, or unless
1278 active_local_sender_retain is set - which can only happen if
1279 active_local_from_check is false.
1280
1281 . If recipients are to be extracted from the message, build the
1282 recipients list from the headers, removing any that were on the
1283 original recipients list (unless extract_addresses_remove_arguments is
1284 false), and at the same time, remove any bcc header that may be present.
1285
1286 . Get the spool file for the data, sort out its unique name, open
1287 and lock it (but don't give it the name yet).
1288
1289 . Generate a "Message-Id" header if the message doesn't have one, for
1290 locally-originated messages.
1291
1292 . Generate a "Received" header.
1293
1294 . Ensure the recipients list is fully qualified and rewritten if necessary.
1295
1296 . If there are any rewriting rules, apply them to the sender address
1297 and also to the headers.
1298
1299 . If there is no from: header, generate one, for locally-generated messages
1300 and messages in "submission mode" only.
1301
1302 . If the sender is local, check that from: is correct, and if not, generate
1303 a Sender: header, unless message comes from a trusted caller, or this
1304 feature is disabled by active_local_from_check being false.
1305
1306 . If there is no "date" header, generate one, for locally-originated
1307 or submission mode messages only.
1308
1309 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1310 dot_ends mode, to the data file. Leave it open, to hold the lock.
1311
1312 . Write the envelope and the headers to a new file.
1313
1314 . Set the name for the header file; close it.
1315
1316 . Set the name for the data file; close it.
1317
1318 Because this function can potentially be called many times in a single
1319 SMTP connection, all store should be got by store_get(), so that it will be
1320 automatically retrieved after the message is accepted.
1321
1322 FUDGE: It seems that sites on the net send out messages with just LF
1323 terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1324 we make the CRs optional in all cases.
1325
1326 July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1327 new regime is now in place in which bare CRs in header lines are turned into LF
1328 followed by a space, so as not to terminate the header line.
1329
1330 February 2004: A bare LF in a header line in a message whose first line was
1331 terminated by CRLF is treated in the same way as a bare CR.
1332
1333 Arguments:
1334 extract_recip TRUE if recipients are to be extracted from the message's
1335 headers
1336
1337 Returns: TRUE there are more messages to be read (SMTP input)
1338 FALSE there are no more messages to be read (non-SMTP input
1339 or SMTP connection collapsed, or other failure)
1340
1341 When reading a message for filter testing, the returned value indicates
1342 whether the headers (which is all that is read) were terminated by '.' or
1343 not. */
1344
1345 BOOL
1346 receive_msg(BOOL extract_recip)
1347 {
1348 int i;
1349 int rc = FAIL;
1350 int msg_size = 0;
1351 int process_info_len = Ustrlen(process_info);
1352 int error_rc = (error_handling == ERRORS_SENDER)?
1353 errors_sender_rc : EXIT_FAILURE;
1354 int header_size = 256;
1355 int start, end, domain, size, sptr;
1356 int id_resolution;
1357 int had_zero = 0;
1358 int prevlines_length = 0;
1359
1360 register int ptr = 0;
1361
1362 BOOL contains_resent_headers = FALSE;
1363 BOOL extracted_ignored = FALSE;
1364 BOOL first_line_ended_crlf = TRUE_UNSET;
1365 BOOL smtp_yield = TRUE;
1366 BOOL yield = FALSE;
1367
1368 BOOL resents_exist = FALSE;
1369 uschar *resent_prefix = US"";
1370 uschar *blackholed_by = NULL;
1371 uschar *blackhole_log_msg = US"";
1372 int cutthrough_done;
1373
1374 flock_t lock_data;
1375 error_block *bad_addresses = NULL;
1376
1377 uschar *frozen_by = NULL;
1378 uschar *queued_by = NULL;
1379
1380 uschar *errmsg, *s;
1381 struct stat statbuf;
1382
1383 /* Final message to give to SMTP caller, and messages from ACLs */
1384
1385 uschar *smtp_reply = NULL;
1386 uschar *user_msg, *log_msg;
1387
1388 /* Working header pointers */
1389
1390 header_line *h, *next;
1391
1392 /* Flags for noting the existence of certain headers (only one left) */
1393
1394 BOOL date_header_exists = FALSE;
1395
1396 /* Pointers to receive the addresses of headers whose contents we need. */
1397
1398 header_line *from_header = NULL;
1399 header_line *subject_header = NULL;
1400 header_line *msgid_header = NULL;
1401 header_line *received_header;
1402
1403 /* Variables for use when building the Received: header. */
1404
1405 uschar *timestamp;
1406 int tslen;
1407
1408 /* Release any open files that might have been cached while preparing to
1409 accept the message - e.g. by verifying addresses - because reading a message
1410 might take a fair bit of real time. */
1411
1412 search_tidyup();
1413
1414 /* Extracting the recipient list from an input file is incompatible with
1415 cutthrough delivery with the no-spool option. It shouldn't be possible
1416 to set up the combination, but just in case kill any ongoing connection. */
1417 if (extract_recip || !smtp_input)
1418 cancel_cutthrough_connection();
1419
1420 /* Initialize the chain of headers by setting up a place-holder for Received:
1421 header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1422 pointing to the end of the chain to make adding headers simple. */
1423
1424 received_header = header_list = header_last = store_get(sizeof(header_line));
1425 header_list->next = NULL;
1426 header_list->type = htype_old;
1427 header_list->text = NULL;
1428 header_list->slen = 0;
1429
1430 /* Control block for the next header to be read. */
1431
1432 next = store_get(sizeof(header_line));
1433 next->text = store_get(header_size);
1434
1435 /* Initialize message id to be null (indicating no message read), and the
1436 header names list to be the normal list. Indicate there is no data file open
1437 yet, initialize the size and warning count, and deal with no size limit. */
1438
1439 message_id[0] = 0;
1440 data_file = NULL;
1441 data_fd = -1;
1442 spool_name[0] = 0;
1443 message_size = 0;
1444 warning_count = 0;
1445 received_count = 1; /* For the one we will add */
1446
1447 if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1448
1449 /* While reading the message, the following counts are computed. */
1450
1451 message_linecount = body_linecount = body_zerocount =
1452 max_received_linelength = 0;
1453
1454 #ifndef DISABLE_DKIM
1455 /* Call into DKIM to set up the context. */
1456 if (smtp_input && !smtp_batched_input && !dkim_disable_verify) dkim_exim_verify_init();
1457 #endif
1458
1459 /* Remember the time of reception. Exim uses time+pid for uniqueness of message
1460 ids, and fractions of a second are required. See the comments that precede the
1461 message id creation below. */
1462
1463 (void)gettimeofday(&message_id_tv, NULL);
1464
1465 /* For other uses of the received time we can operate with granularity of one
1466 second, and for that we use the global variable received_time. This is for
1467 things like ultimate message timeouts. */
1468
1469 received_time = message_id_tv.tv_sec;
1470
1471 /* If SMTP input, set the special handler for timeouts. The alarm() calls
1472 happen in the smtp_getc() function when it refills its buffer. */
1473
1474 if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1475
1476 /* If not SMTP input, timeout happens only if configured, and we just set a
1477 single timeout for the whole message. */
1478
1479 else if (receive_timeout > 0)
1480 {
1481 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1482 alarm(receive_timeout);
1483 }
1484
1485 /* SIGTERM and SIGINT are caught always. */
1486
1487 signal(SIGTERM, data_sigterm_sigint_handler);
1488 signal(SIGINT, data_sigterm_sigint_handler);
1489
1490 /* Header lines in messages are not supposed to be very long, though when
1491 unfolded, to: and cc: headers can take up a lot of store. We must also cope
1492 with the possibility of junk being thrown at us. Start by getting 256 bytes for
1493 storing the header, and extend this as necessary using string_cat().
1494
1495 To cope with total lunacies, impose an upper limit on the length of the header
1496 section of the message, as otherwise the store will fill up. We must also cope
1497 with the possibility of binary zeros in the data. Hence we cannot use fgets().
1498 Folded header lines are joined into one string, leaving the '\n' characters
1499 inside them, so that writing them out reproduces the input.
1500
1501 Loop for each character of each header; the next structure for chaining the
1502 header is set up already, with ptr the offset of the next character in
1503 next->text. */
1504
1505 for (;;)
1506 {
1507 int ch = (receive_getc)();
1508
1509 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1510 SMTP must have a correct "." terminator. */
1511
1512 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1513 {
1514 smtp_reply = handle_lost_connection(US" (header)");
1515 smtp_yield = FALSE;
1516 goto TIDYUP; /* Skip to end of function */
1517 }
1518
1519 /* See if we are at the current header's size limit - there must be at least
1520 four bytes left. This allows for the new character plus a zero, plus two for
1521 extra insertions when we are playing games with dots and carriage returns. If
1522 we are at the limit, extend the text buffer. This could have been done
1523 automatically using string_cat() but because this is a tightish loop storing
1524 only one character at a time, we choose to do it inline. Normally
1525 store_extend() will be able to extend the block; only at the end of a big
1526 store block will a copy be needed. To handle the case of very long headers
1527 (and sometimes lunatic messages can have ones that are 100s of K long) we
1528 call store_release() for strings that have been copied - if the string is at
1529 the start of a block (and therefore the only thing in it, because we aren't
1530 doing any other gets), the block gets freed. We can only do this because we
1531 know there are no other calls to store_get() going on. */
1532
1533 if (ptr >= header_size - 4)
1534 {
1535 int oldsize = header_size;
1536 /* header_size += 256; */
1537 header_size *= 2;
1538 if (!store_extend(next->text, oldsize, header_size))
1539 {
1540 uschar *newtext = store_get(header_size);
1541 memcpy(newtext, next->text, ptr);
1542 store_release(next->text);
1543 next->text = newtext;
1544 }
1545 }
1546
1547 /* Cope with receiving a binary zero. There is dispute about whether
1548 these should be allowed in RFC 822 messages. The middle view is that they
1549 should not be allowed in headers, at least. Exim takes this attitude at
1550 the moment. We can't just stomp on them here, because we don't know that
1551 this line is a header yet. Set a flag to cause scanning later. */
1552
1553 if (ch == 0) had_zero++;
1554
1555 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1556 those from data files use just LF. Treat LF in local SMTP input as a
1557 terminator too. Treat EOF as a line terminator always. */
1558
1559 if (ch == EOF) goto EOL;
1560
1561 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1562 other MTAs accept this. We are therefore forced into this "liberalisation"
1563 too, so we accept LF as a line terminator whatever the source of the message.
1564 However, if the first line of the message ended with a CRLF, we treat a bare
1565 LF specially by inserting a white space after it to ensure that the header
1566 line is not terminated. */
1567
1568 if (ch == '\n')
1569 {
1570 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
1571 else if (first_line_ended_crlf) receive_ungetc(' ');
1572 goto EOL;
1573 }
1574
1575 /* This is not the end of the line. If this is SMTP input and this is
1576 the first character in the line and it is a "." character, ignore it.
1577 This implements the dot-doubling rule, though header lines starting with
1578 dots aren't exactly common. They are legal in RFC 822, though. If the
1579 following is CRLF or LF, this is the line that that terminates the
1580 entire message. We set message_ended to indicate this has happened (to
1581 prevent further reading), and break out of the loop, having freed the
1582 empty header, and set next = NULL to indicate no data line. */
1583
1584 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1585 {
1586 ch = (receive_getc)();
1587 if (ch == '\r')
1588 {
1589 ch = (receive_getc)();
1590 if (ch != '\n')
1591 {
1592 receive_ungetc(ch);
1593 ch = '\r'; /* Revert to CR */
1594 }
1595 }
1596 if (ch == '\n')
1597 {
1598 message_ended = END_DOT;
1599 store_reset(next);
1600 next = NULL;
1601 break; /* End character-reading loop */
1602 }
1603
1604 /* For non-SMTP input, the dot at the start of the line was really a data
1605 character. What is now in ch is the following character. We guaranteed
1606 enough space for this above. */
1607
1608 if (!smtp_input)
1609 {
1610 next->text[ptr++] = '.';
1611 message_size++;
1612 }
1613 }
1614
1615 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1616 remember this case if this is the first line ending. */
1617
1618 if (ch == '\r')
1619 {
1620 ch = (receive_getc)();
1621 if (ch == '\n')
1622 {
1623 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1624 goto EOL;
1625 }
1626
1627 /* Otherwise, put back the character after CR, and turn the bare CR
1628 into LF SP. */
1629
1630 ch = (receive_ungetc)(ch);
1631 next->text[ptr++] = '\n';
1632 message_size++;
1633 ch = ' ';
1634 }
1635
1636 /* We have a data character for the header line. */
1637
1638 next->text[ptr++] = ch; /* Add to buffer */
1639 message_size++; /* Total message size so far */
1640
1641 /* Handle failure due to a humungously long header section. The >= allows
1642 for the terminating \n. Add what we have so far onto the headers list so
1643 that it gets reflected in any error message, and back up the just-read
1644 character. */
1645
1646 if (message_size >= header_maxsize)
1647 {
1648 next->text[ptr] = 0;
1649 next->slen = ptr;
1650 next->type = htype_other;
1651 next->next = NULL;
1652 header_last->next = next;
1653 header_last = next;
1654
1655 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1656 "%s (more than %d characters): message abandoned",
1657 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1658
1659 if (smtp_input)
1660 {
1661 smtp_reply = US"552 Message header is ridiculously long";
1662 receive_swallow_smtp();
1663 goto TIDYUP; /* Skip to end of function */
1664 }
1665
1666 else
1667 {
1668 give_local_error(ERRMESS_VLONGHEADER,
1669 string_sprintf("message header longer than %d characters received: "
1670 "message not accepted", header_maxsize), US"", error_rc, stdin,
1671 header_list->next);
1672 /* Does not return */
1673 }
1674 }
1675
1676 continue; /* With next input character */
1677
1678 /* End of header line reached */
1679
1680 EOL:
1681
1682 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1683
1684 receive_linecount++;
1685 message_linecount++;
1686
1687 /* Keep track of maximum line length */
1688
1689 if (ptr - prevlines_length > max_received_linelength)
1690 max_received_linelength = ptr - prevlines_length;
1691 prevlines_length = ptr + 1;
1692
1693 /* Now put in the terminating newline. There is always space for
1694 at least two more characters. */
1695
1696 next->text[ptr++] = '\n';
1697 message_size++;
1698
1699 /* A blank line signals the end of the headers; release the unwanted
1700 space and set next to NULL to indicate this. */
1701
1702 if (ptr == 1)
1703 {
1704 store_reset(next);
1705 next = NULL;
1706 break;
1707 }
1708
1709 /* There is data in the line; see if the next input character is a
1710 whitespace character. If it is, we have a continuation of this header line.
1711 There is always space for at least one character at this point. */
1712
1713 if (ch != EOF)
1714 {
1715 int nextch = (receive_getc)();
1716 if (nextch == ' ' || nextch == '\t')
1717 {
1718 next->text[ptr++] = nextch;
1719 message_size++;
1720 continue; /* Iterate the loop */
1721 }
1722 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
1723 else ch = EOF; /* Cause main loop to exit at end */
1724 }
1725
1726 /* We have got to the real line end. Terminate the string and release store
1727 beyond it. If it turns out to be a real header, internal binary zeros will
1728 be squashed later. */
1729
1730 next->text[ptr] = 0;
1731 next->slen = ptr;
1732 store_reset(next->text + ptr + 1);
1733
1734 /* Check the running total size against the overall message size limit. We
1735 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1736 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1737 headers - the code to read the body will then also hit the buffer. */
1738
1739 if (message_size > thismessage_size_limit) break;
1740
1741 /* A line that is not syntactically correct for a header also marks
1742 the end of the headers. In this case, we leave next containing the
1743 first data line. This might actually be several lines because of the
1744 continuation logic applied above, but that doesn't matter.
1745
1746 It turns out that smail, and presumably sendmail, accept leading lines
1747 of the form
1748
1749 From ph10 Fri Jan 5 12:35 GMT 1996
1750
1751 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1752 find any documentation of this, but for compatibility it had better be
1753 accepted. Exim restricts it to the case of non-smtp messages, and
1754 treats it as an alternative to the -f command line option. Thus it is
1755 ignored except for trusted users or filter testing. Otherwise it is taken
1756 as the sender address, unless -f was used (sendmail compatibility).
1757
1758 It further turns out that some UUCPs generate the From_line in a different
1759 format, e.g.
1760
1761 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1762
1763 The regex for matching these things is now capable of recognizing both
1764 formats (including 2- and 4-digit years in the latter). In fact, the regex
1765 is now configurable, as is the expansion string to fish out the sender.
1766
1767 Even further on it has been discovered that some broken clients send
1768 these lines in SMTP messages. There is now an option to ignore them from
1769 specified hosts or networks. Sigh. */
1770
1771 if (header_last == header_list &&
1772 (!smtp_input
1773 ||
1774 (sender_host_address != NULL &&
1775 verify_check_host(&ignore_fromline_hosts) == OK)
1776 ||
1777 (sender_host_address == NULL && ignore_fromline_local)
1778 ) &&
1779 regex_match_and_setup(regex_From, next->text, 0, -1))
1780 {
1781 if (!sender_address_forced)
1782 {
1783 uschar *uucp_sender = expand_string(uucp_from_sender);
1784 if (uucp_sender == NULL)
1785 {
1786 log_write(0, LOG_MAIN|LOG_PANIC,
1787 "expansion of \"%s\" failed after matching "
1788 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1789 }
1790 else
1791 {
1792 int start, end, domain;
1793 uschar *errmess;
1794 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1795 &start, &end, &domain, TRUE);
1796 if (newsender != NULL)
1797 {
1798 if (domain == 0 && newsender[0] != 0)
1799 newsender = rewrite_address_qualify(newsender, FALSE);
1800
1801 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
1802 {
1803 sender_address = newsender;
1804
1805 if (trusted_caller || filter_test != FTEST_NONE)
1806 {
1807 authenticated_sender = NULL;
1808 originator_name = US"";
1809 sender_local = FALSE;
1810 }
1811
1812 if (filter_test != FTEST_NONE)
1813 printf("Sender taken from \"From \" line\n");
1814 }
1815 }
1816 }
1817 }
1818 }
1819
1820 /* Not a leading "From " line. Check to see if it is a valid header line.
1821 Header names may contain any non-control characters except space and colon,
1822 amazingly. */
1823
1824 else
1825 {
1826 uschar *p = next->text;
1827
1828 /* If not a valid header line, break from the header reading loop, leaving
1829 next != NULL, indicating that it holds the first line of the body. */
1830
1831 if (isspace(*p)) break;
1832 while (mac_isgraph(*p) && *p != ':') p++;
1833 while (isspace(*p)) p++;
1834 if (*p != ':')
1835 {
1836 body_zerocount = had_zero;
1837 break;
1838 }
1839
1840 /* We have a valid header line. If there were any binary zeroes in
1841 the line, stomp on them here. */
1842
1843 if (had_zero > 0)
1844 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
1845
1846 /* It is perfectly legal to have an empty continuation line
1847 at the end of a header, but it is confusing to humans
1848 looking at such messages, since it looks like a blank line.
1849 Reduce confusion by removing redundant white space at the
1850 end. We know that there is at least one printing character
1851 (the ':' tested for above) so there is no danger of running
1852 off the end. */
1853
1854 p = next->text + ptr - 2;
1855 for (;;)
1856 {
1857 while (*p == ' ' || *p == '\t') p--;
1858 if (*p != '\n') break;
1859 ptr = (p--) - next->text + 1;
1860 message_size -= next->slen - ptr;
1861 next->text[ptr] = 0;
1862 next->slen = ptr;
1863 }
1864
1865 /* Add the header to the chain */
1866
1867 next->type = htype_other;
1868 next->next = NULL;
1869 header_last->next = next;
1870 header_last = next;
1871
1872 /* Check the limit for individual line lengths. This comes after adding to
1873 the chain so that the failing line is reflected if a bounce is generated
1874 (for a local message). */
1875
1876 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
1877 {
1878 log_write(0, LOG_MAIN, "overlong message header line received from "
1879 "%s (more than %d characters): message abandoned",
1880 sender_host_unknown? sender_ident : sender_fullhost,
1881 header_line_maxsize);
1882
1883 if (smtp_input)
1884 {
1885 smtp_reply = US"552 A message header line is too long";
1886 receive_swallow_smtp();
1887 goto TIDYUP; /* Skip to end of function */
1888 }
1889
1890 else
1891 {
1892 give_local_error(ERRMESS_VLONGHDRLINE,
1893 string_sprintf("message header line longer than %d characters "
1894 "received: message not accepted", header_line_maxsize), US"",
1895 error_rc, stdin, header_list->next);
1896 /* Does not return */
1897 }
1898 }
1899
1900 /* Note if any resent- fields exist. */
1901
1902 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
1903 {
1904 resents_exist = TRUE;
1905 resent_prefix = US"Resent-";
1906 }
1907 }
1908
1909 /* The line has been handled. If we have hit EOF, break out of the loop,
1910 indicating no pending data line. */
1911
1912 if (ch == EOF) { next = NULL; break; }
1913
1914 /* Set up for the next header */
1915
1916 header_size = 256;
1917 next = store_get(sizeof(header_line));
1918 next->text = store_get(header_size);
1919 ptr = 0;
1920 had_zero = 0;
1921 prevlines_length = 0;
1922 } /* Continue, starting to read the next header */
1923
1924 /* At this point, we have read all the headers into a data structure in main
1925 store. The first header is still the dummy placeholder for the Received: header
1926 we are going to generate a bit later on. If next != NULL, it contains the first
1927 data line - which terminated the headers before reaching a blank line (not the
1928 normal case). */
1929
1930 DEBUG(D_receive)
1931 {
1932 debug_printf(">>Headers received:\n");
1933 for (h = header_list->next; h != NULL; h = h->next)
1934 debug_printf("%s", h->text);
1935 debug_printf("\n");
1936 }
1937
1938 /* End of file on any SMTP connection is an error. If an incoming SMTP call
1939 is dropped immediately after valid headers, the next thing we will see is EOF.
1940 We must test for this specially, as further down the reading of the data is
1941 skipped if already at EOF. */
1942
1943 if (smtp_input && (receive_feof)())
1944 {
1945 smtp_reply = handle_lost_connection(US" (after header)");
1946 smtp_yield = FALSE;
1947 goto TIDYUP; /* Skip to end of function */
1948 }
1949
1950 /* If this is a filter test run and no headers were read, output a warning
1951 in case there is a mistake in the test message. */
1952
1953 if (filter_test != FTEST_NONE && header_list->next == NULL)
1954 printf("Warning: no message headers read\n");
1955
1956
1957 /* Scan the headers to identify them. Some are merely marked for later
1958 processing; some are dealt with here. */
1959
1960 for (h = header_list->next; h != NULL; h = h->next)
1961 {
1962 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
1963 if (is_resent) contains_resent_headers = TRUE;
1964
1965 switch (header_checkname(h, is_resent))
1966 {
1967 case htype_bcc:
1968 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
1969 break;
1970
1971 case htype_cc:
1972 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
1973 break;
1974
1975 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
1976
1977 case htype_date:
1978 if (!resents_exist || is_resent) date_header_exists = TRUE;
1979 break;
1980
1981 /* Same comments as about Return-Path: below. */
1982
1983 case htype_delivery_date:
1984 if (delivery_date_remove) h->type = htype_old;
1985 break;
1986
1987 /* Same comments as about Return-Path: below. */
1988
1989 case htype_envelope_to:
1990 if (envelope_to_remove) h->type = htype_old;
1991 break;
1992
1993 /* Mark all "From:" headers so they get rewritten. Save the one that is to
1994 be used for Sender: checking. For Sendmail compatibility, if the "From:"
1995 header consists of just the login id of the user who called Exim, rewrite
1996 it with the gecos field first. Apply this rule to Resent-From: if there
1997 are resent- fields. */
1998
1999 case htype_from:
2000 h->type = htype_from;
2001 if (!resents_exist || is_resent)
2002 {
2003 from_header = h;
2004 if (!smtp_input)
2005 {
2006 uschar *s = Ustrchr(h->text, ':') + 1;
2007 while (isspace(*s)) s++;
2008 if (strncmpic(s, originator_login, h->slen - (s - h->text) - 1) == 0)
2009 {
2010 uschar *name = is_resent? US"Resent-From" : US"From";
2011 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2012 originator_login, qualify_domain_sender);
2013 from_header = header_last;
2014 h->type = htype_old;
2015 DEBUG(D_receive|D_rewrite)
2016 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2017 }
2018 }
2019 }
2020 break;
2021
2022 /* Identify the Message-id: header for generating "in-reply-to" in the
2023 autoreply transport. For incoming logging, save any resent- value. In both
2024 cases, take just the first of any multiples. */
2025
2026 case htype_id:
2027 if (msgid_header == NULL && (!resents_exist || is_resent))
2028 {
2029 msgid_header = h;
2030 h->type = htype_id;
2031 }
2032 break;
2033
2034 /* Flag all Received: headers */
2035
2036 case htype_received:
2037 h->type = htype_received;
2038 received_count++;
2039 break;
2040
2041 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2042
2043 case htype_reply_to:
2044 h->type = htype_reply_to;
2045 break;
2046
2047 /* The Return-path: header is supposed to be added to messages when
2048 they leave the SMTP system. We shouldn't receive messages that already
2049 contain Return-path. However, since Exim generates Return-path: on
2050 local delivery, resent messages may well contain it. We therefore
2051 provide an option (which defaults on) to remove any Return-path: headers
2052 on input. Removal actually means flagging as "old", which prevents the
2053 header being transmitted with the message. */
2054
2055 case htype_return_path:
2056 if (return_path_remove) h->type = htype_old;
2057
2058 /* If we are testing a mail filter file, use the value of the
2059 Return-Path: header to set up the return_path variable, which is not
2060 otherwise set. However, remove any <> that surround the address
2061 because the variable doesn't have these. */
2062
2063 if (filter_test != FTEST_NONE)
2064 {
2065 uschar *start = h->text + 12;
2066 uschar *end = start + Ustrlen(start);
2067 while (isspace(*start)) start++;
2068 while (end > start && isspace(end[-1])) end--;
2069 if (*start == '<' && end[-1] == '>')
2070 {
2071 start++;
2072 end--;
2073 }
2074 return_path = string_copyn(start, end - start);
2075 printf("Return-path taken from \"Return-path:\" header line\n");
2076 }
2077 break;
2078
2079 /* If there is a "Sender:" header and the message is locally originated,
2080 and from an untrusted caller and suppress_local_fixups is not set, or if we
2081 are in submission mode for a remote message, mark it "old" so that it will
2082 not be transmitted with the message, unless active_local_sender_retain is
2083 set. (This can only be true if active_local_from_check is false.) If there
2084 are any resent- headers in the message, apply this rule to Resent-Sender:
2085 instead of Sender:. Messages with multiple resent- header sets cannot be
2086 tidily handled. (For this reason, at least one MUA - Pine - turns old
2087 resent- headers into X-resent- headers when resending, leaving just one
2088 set.) */
2089
2090 case htype_sender:
2091 h->type = ((!active_local_sender_retain &&
2092 (
2093 (sender_local && !trusted_caller && !suppress_local_fixups)
2094 || submission_mode
2095 )
2096 ) &&
2097 (!resents_exist||is_resent))?
2098 htype_old : htype_sender;
2099 break;
2100
2101 /* Remember the Subject: header for logging. There is no Resent-Subject */
2102
2103 case htype_subject:
2104 subject_header = h;
2105 break;
2106
2107 /* "To:" gets flagged, and the existence of a recipient header is noted,
2108 whether it's resent- or not. */
2109
2110 case htype_to:
2111 h->type = htype_to;
2112 /****
2113 to_or_cc_header_exists = TRUE;
2114 ****/
2115 break;
2116 }
2117 }
2118
2119 /* Extract recipients from the headers if that is required (the -t option).
2120 Note that this is documented as being done *before* any address rewriting takes
2121 place. There are two possibilities:
2122
2123 (1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2124 recipients already listed are to be REMOVED from the message. Smail 3 works
2125 like this. We need to build a non-recipients tree for that list, because in
2126 subsequent processing this data is held in a tree and that's what the
2127 spool_write_header() function expects. Make sure that non-recipient addresses
2128 are fully qualified and rewritten if necessary.
2129
2130 (2) According to other sendmail documentation, -t ADDS extracted recipients to
2131 those in the command line arguments (and it is rumoured some other MTAs do
2132 this). Therefore, there is an option to make Exim behave this way.
2133
2134 *** Notes on "Resent-" header lines ***
2135
2136 The presence of resent-headers in the message makes -t horribly ambiguous.
2137 Experiments with sendmail showed that it uses recipients for all resent-
2138 headers, totally ignoring the concept of "sets of resent- headers" as described
2139 in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2140 with all the addresses in one instance of each header.
2141
2142 This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2143 error for -t if there were resent- headers in the message. However, after a
2144 discussion on the mailing list, I've learned that there are MUAs that use
2145 resent- headers with -t, and also that the stuff about sets of resent- headers
2146 and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2147 message with -t and resent- header lines makes sure that only *its* resent-
2148 headers are present; previous ones are often renamed as X-resent- for example.
2149
2150 Consequently, Exim has been changed so that, if any resent- header lines are
2151 present, the recipients are taken from all of the appropriate resent- lines,
2152 and not from the ordinary To:, Cc:, etc. */
2153
2154 if (extract_recip)
2155 {
2156 int rcount = 0;
2157 error_block **bnext = &bad_addresses;
2158
2159 if (extract_addresses_remove_arguments)
2160 {
2161 while (recipients_count-- > 0)
2162 {
2163 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2164 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2165 tree_add_nonrecipient(s);
2166 }
2167 recipients_list = NULL;
2168 recipients_count = recipients_list_max = 0;
2169 }
2170
2171 /* Now scan the headers */
2172
2173 for (h = header_list->next; h != NULL; h = h->next)
2174 {
2175 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2176 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2177 {
2178 uschar *s = Ustrchr(h->text, ':') + 1;
2179 while (isspace(*s)) s++;
2180
2181 parse_allow_group = TRUE; /* Allow address group syntax */
2182
2183 while (*s != 0)
2184 {
2185 uschar *ss = parse_find_address_end(s, FALSE);
2186 uschar *recipient, *errmess, *p, *pp;
2187 int start, end, domain;
2188
2189 /* Check on maximum */
2190
2191 if (recipients_max > 0 && ++rcount > recipients_max)
2192 {
2193 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2194 US"message rejected: ", error_rc, stdin, NULL);
2195 /* Does not return */
2196 }
2197
2198 /* Make a copy of the address, and remove any internal newlines. These
2199 may be present as a result of continuations of the header line. The
2200 white space that follows the newline must not be removed - it is part
2201 of the header. */
2202
2203 pp = recipient = store_get(ss - s + 1);
2204 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2205 *pp = 0;
2206 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2207 &domain, FALSE);
2208
2209 /* Keep a list of all the bad addresses so we can send a single
2210 error message at the end. However, an empty address is not an error;
2211 just ignore it. This can come from an empty group list like
2212
2213 To: Recipients of list:;
2214
2215 If there are no recipients at all, an error will occur later. */
2216
2217 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2218 {
2219 int len = Ustrlen(s);
2220 error_block *b = store_get(sizeof(error_block));
2221 while (len > 0 && isspace(s[len-1])) len--;
2222 b->next = NULL;
2223 b->text1 = string_printing(string_copyn(s, len));
2224 b->text2 = errmess;
2225 *bnext = b;
2226 bnext = &(b->next);
2227 }
2228
2229 /* If the recipient is already in the nonrecipients tree, it must
2230 have appeared on the command line with the option extract_addresses_
2231 remove_arguments set. Do not add it to the recipients, and keep a note
2232 that this has happened, in order to give a better error if there are
2233 no recipients left. */
2234
2235 else if (recipient != NULL)
2236 {
2237 if (tree_search(tree_nonrecipients, recipient) == NULL)
2238 receive_add_recipient(recipient, -1);
2239 else
2240 extracted_ignored = TRUE;
2241 }
2242
2243 /* Move on past this address */
2244
2245 s = ss + (*ss? 1:0);
2246 while (isspace(*s)) s++;
2247 } /* Next address */
2248
2249 parse_allow_group = FALSE; /* Reset group syntax flags */
2250 parse_found_group = FALSE;
2251
2252 /* If this was the bcc: header, mark it "old", which means it
2253 will be kept on the spool, but not transmitted as part of the
2254 message. */
2255
2256 if (h->type == htype_bcc) h->type = htype_old;
2257 } /* For appropriate header line */
2258 } /* For each header line */
2259
2260 }
2261
2262 /* Now build the unique message id. This has changed several times over the
2263 lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2264 Retaining all the history in the comment has become too unwieldy - read
2265 previous release sources if you want it.
2266
2267 The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2268 The first part is the current time, in seconds. The second part is the current
2269 pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2270 can hold a number in the range 0-3843. It used to be a computed sequence
2271 number, but is now the fractional component of the current time in units of
2272 1/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2273 received, Exim ensures that the timer has ticked at the appropriate level
2274 before proceeding, to avoid duplication if the pid happened to be re-used
2275 within the same time period. It seems likely that most messages will take at
2276 least half a millisecond to be received, so no delay will normally be
2277 necessary. At least for some time...
2278
2279 There is a modification when localhost_number is set. Formerly this was allowed
2280 to be as large as 255. Now it is restricted to the range 0-16, and the final
2281 component of the message id becomes (localhost_number * 200) + fractional time
2282 in units of 1/200 of a second (i.e. a value in the range 0-3399).
2283
2284 Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2285 Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2286 still allows the tttttt field to hold a large enough number to last for some
2287 more decades, and the final two-digit field can hold numbers up to 1295, which
2288 is enough for milliseconds (instead of 1/2000 of a second).
2289
2290 However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2291 pid, so it is probably safe because pids have to be positive. The
2292 localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2293 final field becomes (localhost_number * 100) + fractional time in centiseconds.
2294
2295 Note that string_base62() returns its data in a static storage block, so it
2296 must be copied before calling string_base62() again. It always returns exactly
2297 6 characters.
2298
2299 There doesn't seem to be anything in the RFC which requires a message id to
2300 start with a letter, but Smail was changed to ensure this. The external form of
2301 the message id (as supplied by string expansion) therefore starts with an
2302 additional leading 'E'. The spool file names do not include this leading
2303 letter and it is not used internally.
2304
2305 NOTE: If ever the format of message ids is changed, the regular expression for
2306 checking that a string is in this format must be updated in a corresponding
2307 way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2308 must also be changed to reflect the correct string length. Then, of course,
2309 other programs that rely on the message id format will need updating too. */
2310
2311 Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2312 message_id[6] = '-';
2313 Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2314
2315 /* Deal with the case where the host number is set. The value of the number was
2316 checked when it was read, to ensure it isn't too big. The timing granularity is
2317 left in id_resolution so that an appropriate wait can be done after receiving
2318 the message, if necessary (we hope it won't be). */
2319
2320 if (host_number_string != NULL)
2321 {
2322 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2323 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2324 string_base62((long int)(
2325 host_number * (1000000/id_resolution) +
2326 message_id_tv.tv_usec/id_resolution)) + 4);
2327 }
2328
2329 /* Host number not set: final field is just the fractional time at an
2330 appropriate resolution. */
2331
2332 else
2333 {
2334 id_resolution = (BASE_62 == 62)? 500 : 1000;
2335 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2336 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2337 }
2338
2339 /* Add the current message id onto the current process info string if
2340 it will fit. */
2341
2342 (void)string_format(process_info + process_info_len,
2343 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2344
2345 /* If we are using multiple input directories, set up the one for this message
2346 to be the least significant base-62 digit of the time of arrival. Otherwise
2347 ensure that it is an empty string. */
2348
2349 message_subdir[0] = split_spool_directory? message_id[5] : 0;
2350
2351 /* Now that we have the message-id, if there is no message-id: header, generate
2352 one, but only for local (without suppress_local_fixups) or submission mode
2353 messages. This can be user-configured if required, but we had better flatten
2354 any illegal characters therein. */
2355
2356 if (msgid_header == NULL &&
2357 ((sender_host_address == NULL && !suppress_local_fixups)
2358 || submission_mode))
2359 {
2360 uschar *p;
2361 uschar *id_text = US"";
2362 uschar *id_domain = primary_hostname;
2363
2364 /* Permit only letters, digits, dots, and hyphens in the domain */
2365
2366 if (message_id_domain != NULL)
2367 {
2368 uschar *new_id_domain = expand_string(message_id_domain);
2369 if (new_id_domain == NULL)
2370 {
2371 if (!expand_string_forcedfail)
2372 log_write(0, LOG_MAIN|LOG_PANIC,
2373 "expansion of \"%s\" (message_id_header_domain) "
2374 "failed: %s", message_id_domain, expand_string_message);
2375 }
2376 else if (*new_id_domain != 0)
2377 {
2378 id_domain = new_id_domain;
2379 for (p = id_domain; *p != 0; p++)
2380 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2381 }
2382 }
2383
2384 /* Permit all characters except controls and RFC 2822 specials in the
2385 additional text part. */
2386
2387 if (message_id_text != NULL)
2388 {
2389 uschar *new_id_text = expand_string(message_id_text);
2390 if (new_id_text == NULL)
2391 {
2392 if (!expand_string_forcedfail)
2393 log_write(0, LOG_MAIN|LOG_PANIC,
2394 "expansion of \"%s\" (message_id_header_text) "
2395 "failed: %s", message_id_text, expand_string_message);
2396 }
2397 else if (*new_id_text != 0)
2398 {
2399 id_text = new_id_text;
2400 for (p = id_text; *p != 0; p++)
2401 if (mac_iscntrl_or_special(*p)) *p = '-';
2402 }
2403 }
2404
2405 /* Add the header line
2406 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2407 * appended, to preserve classical expectations of header ordering. */
2408
2409 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
2410 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2411 (*id_text == 0)? "" : ".", id_text, id_domain);
2412 }
2413
2414 /* If we are to log recipients, keep a copy of the raw ones before any possible
2415 rewriting. Must copy the count, because later ACLs and the local_scan()
2416 function may mess with the real recipients. */
2417
2418 if ((log_extra_selector & LX_received_recipients) != 0)
2419 {
2420 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2421 for (i = 0; i < recipients_count; i++)
2422 raw_recipients[i] = string_copy(recipients_list[i].address);
2423 raw_recipients_count = recipients_count;
2424 }
2425
2426 /* Ensure the recipients list is fully qualified and rewritten. Unqualified
2427 recipients will get here only if the conditions were right (allow_unqualified_
2428 recipient is TRUE). */
2429
2430 for (i = 0; i < recipients_count; i++)
2431 recipients_list[i].address =
2432 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2433 global_rewrite_rules, rewrite_existflags);
2434
2435 /* If there is no From: header, generate one for local (without
2436 suppress_local_fixups) or submission_mode messages. If there is no sender
2437 address, but the sender is local or this is a local delivery error, use the
2438 originator login. This shouldn't happen for genuine bounces, but might happen
2439 for autoreplies. The addition of From: must be done *before* checking for the
2440 possible addition of a Sender: header, because untrusted_set_sender allows an
2441 untrusted user to set anything in the envelope (which might then get info
2442 From:) but we still want to ensure a valid Sender: if it is required. */
2443
2444 if (from_header == NULL &&
2445 ((sender_host_address == NULL && !suppress_local_fixups)
2446 || submission_mode))
2447 {
2448 uschar *oname = US"";
2449
2450 /* Use the originator_name if this is a locally submitted message and the
2451 caller is not trusted. For trusted callers, use it only if -F was used to
2452 force its value or if we have a non-SMTP message for which -f was not used
2453 to set the sender. */
2454
2455 if (sender_host_address == NULL)
2456 {
2457 if (!trusted_caller || sender_name_forced ||
2458 (!smtp_input && !sender_address_forced))
2459 oname = originator_name;
2460 }
2461
2462 /* For non-locally submitted messages, the only time we use the originator
2463 name is when it was forced by the /name= option on control=submission. */
2464
2465 else
2466 {
2467 if (submission_name != NULL) oname = submission_name;
2468 }
2469
2470 /* Envelope sender is empty */
2471
2472 if (sender_address[0] == 0)
2473 {
2474 uschar *fromstart, *fromend;
2475
2476 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2477 oname, (oname[0] == 0)? "" : " <");
2478 fromend = (oname[0] == 0)? US"" : US">";
2479
2480 if (sender_local || local_error_message)
2481 {
2482 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2483 local_part_quote(originator_login), qualify_domain_sender,
2484 fromend);
2485 }
2486 else if (submission_mode && authenticated_id != NULL)
2487 {
2488 if (submission_domain == NULL)
2489 {
2490 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2491 local_part_quote(authenticated_id), qualify_domain_sender,
2492 fromend);
2493 }
2494 else if (submission_domain[0] == 0) /* empty => whole address set */
2495 {
2496 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2497 fromend);
2498 }
2499 else
2500 {
2501 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2502 local_part_quote(authenticated_id), submission_domain,
2503 fromend);
2504 }
2505 from_header = header_last; /* To get it checked for Sender: */
2506 }
2507 }
2508
2509 /* There is a non-null envelope sender. Build the header using the original
2510 sender address, before any rewriting that might have been done while
2511 verifying it. */
2512
2513 else
2514 {
2515 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2516 oname,
2517 (oname[0] == 0)? "" : " <",
2518 (sender_address_unrewritten == NULL)?
2519 sender_address : sender_address_unrewritten,
2520 (oname[0] == 0)? "" : ">");
2521
2522 from_header = header_last; /* To get it checked for Sender: */
2523 }
2524 }
2525
2526
2527 /* If the sender is local (without suppress_local_fixups), or if we are in
2528 submission mode and there is an authenticated_id, check that an existing From:
2529 is correct, and if not, generate a Sender: header, unless disabled. Any
2530 previously-existing Sender: header was removed above. Note that sender_local,
2531 as well as being TRUE if the caller of exim is not trusted, is also true if a
2532 trusted caller did not supply a -f argument for non-smtp input. To allow
2533 trusted callers to forge From: without supplying -f, we have to test explicitly
2534 here. If the From: header contains more than one address, then the call to
2535 parse_extract_address fails, and a Sender: header is inserted, as required. */
2536
2537 if (from_header != NULL &&
2538 (active_local_from_check &&
2539 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
2540 (submission_mode && authenticated_id != NULL))
2541 ))
2542 {
2543 BOOL make_sender = TRUE;
2544 int start, end, domain;
2545 uschar *errmess;
2546 uschar *from_address =
2547 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2548 &start, &end, &domain, FALSE);
2549 uschar *generated_sender_address;
2550
2551 if (submission_mode)
2552 {
2553 if (submission_domain == NULL)
2554 {
2555 generated_sender_address = string_sprintf("%s@%s",
2556 local_part_quote(authenticated_id), qualify_domain_sender);
2557 }
2558 else if (submission_domain[0] == 0) /* empty => full address */
2559 {
2560 generated_sender_address = string_sprintf("%s",
2561 authenticated_id);
2562 }
2563 else
2564 {
2565 generated_sender_address = string_sprintf("%s@%s",
2566 local_part_quote(authenticated_id), submission_domain);
2567 }
2568 }
2569 else
2570 generated_sender_address = string_sprintf("%s@%s",
2571 local_part_quote(originator_login), qualify_domain_sender);
2572
2573 /* Remove permitted prefixes and suffixes from the local part of the From:
2574 address before doing the comparison with the generated sender. */
2575
2576 if (from_address != NULL)
2577 {
2578 int slen;
2579 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2580
2581 if (at != NULL) *at = 0;
2582 from_address += route_check_prefix(from_address, local_from_prefix);
2583 slen = route_check_suffix(from_address, local_from_suffix);
2584 if (slen > 0)
2585 {
2586 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2587 from_address += slen;
2588 }
2589 if (at != NULL) *at = '@';
2590
2591 if (strcmpic(generated_sender_address, from_address) == 0 ||
2592 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2593 make_sender = FALSE;
2594 }
2595
2596 /* We have to cause the Sender header to be rewritten if there are
2597 appropriate rewriting rules. */
2598
2599 if (make_sender)
2600 {
2601 if (submission_mode && submission_name == NULL)
2602 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2603 generated_sender_address);
2604 else
2605 header_add(htype_sender, "%sSender: %s <%s>\n",
2606 resent_prefix,
2607 submission_mode? submission_name : originator_name,
2608 generated_sender_address);
2609 }
2610
2611 /* Ensure that a non-null envelope sender address corresponds to the
2612 submission mode sender address. */
2613
2614 if (submission_mode && sender_address[0] != 0)
2615 {
2616 if (sender_address_unrewritten == NULL)
2617 sender_address_unrewritten = sender_address;
2618 sender_address = generated_sender_address;
2619 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2620 log_write(L_address_rewrite, LOG_MAIN,
2621 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2622 sender_address_unrewritten, generated_sender_address);
2623 }
2624 }
2625
2626
2627 /* If there are any rewriting rules, apply them to the sender address, unless
2628 it has already been rewritten as part of verification for SMTP input. */
2629
2630 if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2631 sender_address[0] != 0)
2632 {
2633 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2634 global_rewrite_rules, rewrite_existflags);
2635 DEBUG(D_receive|D_rewrite)
2636 debug_printf("rewritten sender = %s\n", sender_address);
2637 }
2638
2639
2640 /* The headers must be run through rewrite_header(), because it ensures that
2641 addresses are fully qualified, as well as applying any rewriting rules that may
2642 exist.
2643
2644 Qualification of header addresses in a message from a remote host happens only
2645 if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2646 appropriate. For local messages, qualification always happens, unless -bnq is
2647 used to explicitly suppress it. No rewriting is done for an unqualified address
2648 that is left untouched.
2649
2650 We start at the second header, skipping our own Received:. This rewriting is
2651 documented as happening *after* recipient addresses are taken from the headers
2652 by the -t command line option. An added Sender: gets rewritten here. */
2653
2654 for (h = header_list->next; h != NULL; h = h->next)
2655 {
2656 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2657 rewrite_existflags, TRUE);
2658 if (newh != NULL) h = newh;
2659 }
2660
2661
2662 /* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2663 "cc", or "bcc". Note that although the minimal examples in RFC 822 show just
2664 "to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2665 exists, this applies to the set of resent- headers rather than the normal set.
2666
2667 The requirement for a recipient header has been removed in RFC 2822. At this
2668 point in the code, earlier versions of Exim added a To: header for locally
2669 submitted messages, and an empty Bcc: header for others. In the light of the
2670 changes in RFC 2822, this was dropped in November 2003. */
2671
2672
2673 /* If there is no date header, generate one if the message originates locally
2674 (i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2675 submission mode flag is set. Messages without Date: are not valid, but it seems
2676 to be more confusing if Exim adds one to all remotely-originated messages.
2677 As per Message-Id, we prepend if resending, else append.
2678 */
2679
2680 if (!date_header_exists &&
2681 ((sender_host_address == NULL && !suppress_local_fixups)
2682 || submission_mode))
2683 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2684 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
2685
2686 search_tidyup(); /* Free any cached resources */
2687
2688 /* Show the complete set of headers if debugging. Note that the first one (the
2689 new Received:) has not yet been set. */
2690
2691 DEBUG(D_receive)
2692 {
2693 debug_printf(">>Headers after rewriting and local additions:\n");
2694 for (h = header_list->next; h != NULL; h = h->next)
2695 debug_printf("%c %s", h->type, h->text);
2696 debug_printf("\n");
2697 }
2698
2699 /* The headers are now complete in store. If we are running in filter
2700 testing mode, that is all this function does. Return TRUE if the message
2701 ended with a dot. */
2702
2703 if (filter_test != FTEST_NONE)
2704 {
2705 process_info[process_info_len] = 0;
2706 return message_ended == END_DOT;
2707 }
2708
2709 /* Cutthrough delivery:
2710 We have to create the Received header now rather than at the end of reception,
2711 so the timestamp behaviour is a change to the normal case.
2712 XXX Ensure this gets documented XXX.
2713 Having created it, send the headers to the destination.
2714 */
2715 if (cutthrough_fd >= 0)
2716 {
2717 if (received_count > received_headers_max)
2718 {
2719 cancel_cutthrough_connection();
2720 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2721 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2722 "Too many \"Received\" headers",
2723 sender_address,
2724 (sender_fullhost == NULL)? "" : " H=",
2725 (sender_fullhost == NULL)? US"" : sender_fullhost,
2726 (sender_ident == NULL)? "" : " U=",
2727 (sender_ident == NULL)? US"" : sender_ident);
2728 message_id[0] = 0; /* Indicate no message accepted */
2729 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2730 goto TIDYUP; /* Skip to end of function */
2731 }
2732 received_header_gen();
2733 add_acl_headers(US"MAIL or RCPT");
2734 (void) cutthrough_headers_send();
2735 }
2736
2737
2738 /* Open a new spool file for the data portion of the message. We need
2739 to access it both via a file descriptor and a stream. Try to make the
2740 directory if it isn't there. Note re use of sprintf: spool_directory
2741 is checked on input to be < 200 characters long. */
2742
2743 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir,
2744 message_id);
2745 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2746 if (data_fd < 0)
2747 {
2748 if (errno == ENOENT)
2749 {
2750 uschar temp[16];
2751 sprintf(CS temp, "input/%s", message_subdir);
2752 if (message_subdir[0] == 0) temp[5] = 0;
2753 (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE);
2754 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2755 }
2756 if (data_fd < 0)
2757 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2758 spool_name, strerror(errno));
2759 }
2760
2761 /* Make sure the file's group is the Exim gid, and double-check the mode
2762 because the group setting doesn't always get set automatically. */
2763
2764 (void)fchown(data_fd, exim_uid, exim_gid);
2765 (void)fchmod(data_fd, SPOOL_MODE);
2766
2767 /* We now have data file open. Build a stream for it and lock it. We lock only
2768 the first line of the file (containing the message ID) because otherwise there
2769 are problems when Exim is run under Cygwin (I'm told). See comments in
2770 spool_in.c, where the same locking is done. */
2771
2772 data_file = fdopen(data_fd, "w+");
2773 lock_data.l_type = F_WRLCK;
2774 lock_data.l_whence = SEEK_SET;
2775 lock_data.l_start = 0;
2776 lock_data.l_len = SPOOL_DATA_START_OFFSET;
2777
2778 if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2779 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2780 errno, strerror(errno));
2781
2782 /* We have an open, locked data file. Write the message id to it to make it
2783 self-identifying. Then read the remainder of the input of this message and
2784 write it to the data file. If the variable next != NULL, it contains the first
2785 data line (which was read as a header but then turned out not to have the right
2786 format); write it (remembering that it might contain binary zeros). The result
2787 of fwrite() isn't inspected; instead we call ferror() below. */
2788
2789 fprintf(data_file, "%s-D\n", message_id);
2790 if (next != NULL)
2791 {
2792 uschar *s = next->text;
2793 int len = next->slen;
2794 (void)fwrite(s, 1, len, data_file);
2795 body_linecount++; /* Assumes only 1 line */
2796 }
2797
2798 /* Note that we might already be at end of file, or the logical end of file
2799 (indicated by '.'), or might have encountered an error while writing the
2800 message id or "next" line. */
2801
2802 if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2803 {
2804 if (smtp_input)
2805 {
2806 message_ended = read_message_data_smtp(data_file);
2807 receive_linecount++; /* The terminating "." line */
2808 }
2809 else message_ended = read_message_data(data_file);
2810
2811 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2812 message_linecount += body_linecount;
2813
2814 /* Handle premature termination of SMTP */
2815
2816 if (smtp_input && message_ended == END_EOF)
2817 {
2818 Uunlink(spool_name); /* Lose data file when closed */
2819 cancel_cutthrough_connection();
2820 message_id[0] = 0; /* Indicate no message accepted */
2821 smtp_reply = handle_lost_connection(US"");
2822 smtp_yield = FALSE;
2823 goto TIDYUP; /* Skip to end of function */
2824 }
2825
2826 /* Handle message that is too big. Don't use host_or_ident() in the log
2827 message; we want to see the ident value even for non-remote messages. */
2828
2829 if (message_ended == END_SIZE)
2830 {
2831 Uunlink(spool_name); /* Lose the data file when closed */
2832 cancel_cutthrough_connection();
2833 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2834
2835 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2836 "message too big: read=%d max=%d",
2837 sender_address,
2838 (sender_fullhost == NULL)? "" : " H=",
2839 (sender_fullhost == NULL)? US"" : sender_fullhost,
2840 (sender_ident == NULL)? "" : " U=",
2841 (sender_ident == NULL)? US"" : sender_ident,
2842 message_size,
2843 thismessage_size_limit);
2844
2845 if (smtp_input)
2846 {
2847 smtp_reply = US"552 Message size exceeds maximum permitted";
2848 message_id[0] = 0; /* Indicate no message accepted */
2849 goto TIDYUP; /* Skip to end of function */
2850 }
2851 else
2852 {
2853 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2854 give_local_error(ERRMESS_TOOBIG,
2855 string_sprintf("message too big (max=%d)", thismessage_size_limit),
2856 US"message rejected: ", error_rc, data_file, header_list);
2857 /* Does not return */
2858 }
2859 }
2860 }
2861
2862 /* Restore the standard SIGALRM handler for any subsequent processing. (For
2863 example, there may be some expansion in an ACL that uses a timer.) */
2864
2865 os_non_restarting_signal(SIGALRM, sigalrm_handler);
2866
2867 /* The message body has now been read into the data file. Call fflush() to
2868 empty the buffers in C, and then call fsync() to get the data written out onto
2869 the disk, as fflush() doesn't do this (or at least, it isn't documented as
2870 having to do this). If there was an I/O error on either input or output,
2871 attempt to send an error message, and unlink the spool file. For non-SMTP input
2872 we can then give up. Note that for SMTP input we must swallow the remainder of
2873 the input in cases of output errors, since the far end doesn't expect to see
2874 anything until the terminating dot line is sent. */
2875
2876 if (fflush(data_file) == EOF || ferror(data_file) ||
2877 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
2878 {
2879 uschar *msg_errno = US strerror(errno);
2880 BOOL input_error = (receive_ferror)() != 0;
2881 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
2882 input_error? "Input read" : "Spool write",
2883 msg_errno,
2884 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
2885
2886 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
2887 Uunlink(spool_name); /* Lose the data file */
2888 cancel_cutthrough_connection();
2889
2890 if (smtp_input)
2891 {
2892 if (input_error)
2893 smtp_reply = US"451 Error while reading input data";
2894 else
2895 {
2896 smtp_reply = US"451 Error while writing spool file";
2897 receive_swallow_smtp();
2898 }
2899 message_id[0] = 0; /* Indicate no message accepted */
2900 goto TIDYUP; /* Skip to end of function */
2901 }
2902
2903 else
2904 {
2905 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2906 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
2907 header_list);
2908 /* Does not return */
2909 }
2910 }
2911
2912
2913 /* No I/O errors were encountered while writing the data file. */
2914
2915 DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
2916
2917
2918 /* If there were any bad addresses extracted by -t, or there were no recipients
2919 left after -t, send a message to the sender of this message, or write it to
2920 stderr if the error handling option is set that way. Note that there may
2921 legitimately be no recipients for an SMTP message if they have all been removed
2922 by "discard".
2923
2924 We need to rewind the data file in order to read it. In the case of no
2925 recipients or stderr error writing, throw the data file away afterwards, and
2926 exit. (This can't be SMTP, which always ensures there's at least one
2927 syntactically good recipient address.) */
2928
2929 if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
2930 {
2931 DEBUG(D_receive)
2932 {
2933 if (recipients_count == 0) debug_printf("*** No recipients\n");
2934 if (bad_addresses != NULL)
2935 {
2936 error_block *eblock = bad_addresses;
2937 debug_printf("*** Bad address(es)\n");
2938 while (eblock != NULL)
2939 {
2940 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
2941 eblock = eblock->next;
2942 }
2943 }
2944 }
2945
2946 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2947
2948 /* If configured to send errors to the sender, but this fails, force
2949 a failure error code. We use a special one for no recipients so that it
2950 can be detected by the autoreply transport. Otherwise error_rc is set to
2951 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
2952 it is EXIT_SUCCESS. */
2953
2954 if (error_handling == ERRORS_SENDER)
2955 {
2956 if (!moan_to_sender(
2957 (bad_addresses == NULL)?
2958 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
2959 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
2960 bad_addresses, header_list, data_file, FALSE))
2961 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
2962 }
2963 else
2964 {
2965 if (bad_addresses == NULL)
2966 {
2967 if (extracted_ignored)
2968 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
2969 else
2970 fprintf(stderr, "exim: no recipients in message\n");
2971 }
2972 else
2973 {
2974 fprintf(stderr, "exim: invalid address%s",
2975 (bad_addresses->next == NULL)? ":" : "es:\n");
2976 while (bad_addresses != NULL)
2977 {
2978 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
2979 bad_addresses->text2);
2980 bad_addresses = bad_addresses->next;
2981 }
2982 }
2983 }
2984
2985 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
2986 {
2987 Uunlink(spool_name);
2988 (void)fclose(data_file);
2989 exim_exit(error_rc);
2990 }
2991 }
2992
2993 /* Data file successfully written. Generate text for the Received: header by
2994 expanding the configured string, and adding a timestamp. By leaving this
2995 operation till now, we ensure that the timestamp is the time that message
2996 reception was completed. However, this is deliberately done before calling the
2997 data ACL and local_scan().
2998
2999 This Received: header may therefore be inspected by the data ACL and by code in
3000 the local_scan() function. When they have run, we update the timestamp to be
3001 the final time of reception.
3002
3003 If there is just one recipient, set up its value in the $received_for variable
3004 for use when we generate the Received: header.
3005
3006 Note: the checking for too many Received: headers is handled by the delivery
3007 code. */
3008 /*XXX eventually add excess Received: check for cutthrough case back when classifying them */
3009
3010 if (received_header->text == NULL) /* Non-cutthrough case */
3011 {
3012 received_header_gen();
3013
3014 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
3015
3016 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3017 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
3018
3019 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3020 now, before running the DATA ACL. */
3021
3022 add_acl_headers(US"MAIL or RCPT");
3023 }
3024 else
3025 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3026 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
3027
3028 /* If an ACL is specified for checking things at this stage of reception of a
3029 message, run it, unless all the recipients were removed by "discard" in earlier
3030 ACLs. That is the only case in which recipients_count can be zero at this
3031 stage. Set deliver_datafile to point to the data file so that $message_body and
3032 $message_body_end can be extracted if needed. Allow $recipients in expansions.
3033 */
3034
3035 deliver_datafile = data_fd;
3036 user_msg = NULL;
3037
3038 enable_dollar_recipients = TRUE;
3039
3040 if (recipients_count == 0)
3041 {
3042 blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL";
3043 }
3044 else
3045 {
3046 /* Handle interactive SMTP messages */
3047
3048 if (smtp_input && !smtp_batched_input)
3049 {
3050
3051 #ifndef DISABLE_DKIM
3052 if (!dkim_disable_verify)
3053 {
3054 /* Finish verification, this will log individual signature results to
3055 the mainlog */
3056 dkim_exim_verify_finish();
3057
3058 /* Check if we must run the DKIM ACL */
3059 if ((acl_smtp_dkim != NULL) &&
3060 (dkim_verify_signers != NULL) &&
3061 (dkim_verify_signers[0] != '\0'))
3062 {
3063 uschar *dkim_verify_signers_expanded =
3064 expand_string(dkim_verify_signers);
3065 if (dkim_verify_signers_expanded == NULL)
3066 {
3067 log_write(0, LOG_MAIN|LOG_PANIC,
3068 "expansion of dkim_verify_signers option failed: %s",
3069 expand_string_message);
3070 }
3071 else
3072 {
3073 int sep = 0;
3074 uschar *ptr = dkim_verify_signers_expanded;
3075 uschar *item = NULL;
3076 uschar *seen_items = NULL;
3077 int seen_items_size = 0;
3078 int seen_items_offset = 0;
3079 uschar itembuf[256];
3080 /* Default to OK when no items are present */
3081 rc = OK;
3082 while ((item = string_nextinlist(&ptr, &sep,
3083 itembuf,
3084 sizeof(itembuf))) != NULL)
3085 {
3086 /* Prevent running ACL for an empty item */
3087 if (!item || (item[0] == '\0')) continue;
3088 /* Only run ACL once for each domain or identity, no matter how often it
3089 appears in the expanded list. */
3090 if (seen_items != NULL)
3091 {
3092 uschar *seen_item = NULL;
3093 uschar seen_item_buf[256];
3094 uschar *seen_items_list = seen_items;
3095 int seen_this_item = 0;
3096
3097 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
3098 seen_item_buf,
3099 sizeof(seen_item_buf))) != NULL)
3100 {
3101 if (Ustrcmp(seen_item,item) == 0)
3102 {
3103 seen_this_item = 1;
3104 break;
3105 }
3106 }
3107
3108 if (seen_this_item > 0)
3109 {
3110 DEBUG(D_receive)
3111 debug_printf("acl_smtp_dkim: skipping signer %s, already seen\n", item);
3112 continue;
3113 }
3114
3115 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,":");
3116 }
3117
3118 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,item);
3119 seen_items[seen_items_offset] = '\0';
3120
3121 DEBUG(D_receive)
3122 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n", item);
3123
3124 dkim_exim_acl_setup(item);
3125 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim, &user_msg, &log_msg);
3126
3127 if (rc != OK)
3128 {
3129 DEBUG(D_receive)
3130 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, skipping remaining items\n", rc, item);
3131 cancel_cutthrough_connection();
3132 break;
3133 }
3134 }
3135 add_acl_headers(US"DKIM");
3136 if (rc == DISCARD)
3137 {
3138 recipients_count = 0;
3139 blackholed_by = US"DKIM ACL";
3140 if (log_msg != NULL)
3141 blackhole_log_msg = string_sprintf(": %s", log_msg);
3142 }
3143 else if (rc != OK)
3144 {
3145 Uunlink(spool_name);
3146 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
3147 smtp_yield = FALSE; /* No more messsages after dropped connection */
3148 smtp_reply = US""; /* Indicate reply already sent */
3149 message_id[0] = 0; /* Indicate no message accepted */
3150 goto TIDYUP; /* Skip to end of function */
3151 }
3152 }
3153 }
3154 }
3155 #endif /* DISABLE_DKIM */
3156
3157 #ifdef WITH_CONTENT_SCAN
3158 if (recipients_count > 0 &&
3159 acl_smtp_mime != NULL &&
3160 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3161 goto TIDYUP;
3162 #endif /* WITH_CONTENT_SCAN */
3163
3164 /* Check the recipients count again, as the MIME ACL might have changed
3165 them. */
3166
3167 if (acl_smtp_data != NULL && recipients_count > 0)
3168 {
3169 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
3170 add_acl_headers(US"DATA");
3171 if (rc == DISCARD)
3172 {
3173 recipients_count = 0;
3174 blackholed_by = US"DATA ACL";
3175 if (log_msg != NULL)
3176 blackhole_log_msg = string_sprintf(": %s", log_msg);
3177 cancel_cutthrough_connection();
3178 }
3179 else if (rc != OK)
3180 {
3181 Uunlink(spool_name);
3182 cancel_cutthrough_connection();
3183 #ifdef WITH_CONTENT_SCAN
3184 unspool_mbox();
3185 #endif
3186 #ifdef EXPERIMENTAL_DCC
3187 dcc_ok = 0;
3188 #endif
3189 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
3190 smtp_yield = FALSE; /* No more messsages after dropped connection */
3191 smtp_reply = US""; /* Indicate reply already sent */
3192 message_id[0] = 0; /* Indicate no message accepted */
3193 goto TIDYUP; /* Skip to end of function */
3194 }
3195 }
3196 }
3197
3198 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3199 we cannot take different actions for permanent and temporary rejections. */
3200
3201 else
3202 {
3203
3204 #ifdef WITH_CONTENT_SCAN
3205 if (acl_not_smtp_mime != NULL &&
3206 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3207 &blackholed_by))
3208 goto TIDYUP;
3209 #endif /* WITH_CONTENT_SCAN */
3210
3211 if (acl_not_smtp != NULL)
3212 {
3213 uschar *user_msg, *log_msg;
3214 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3215 if (rc == DISCARD)
3216 {
3217 recipients_count = 0;
3218 blackholed_by = US"non-SMTP ACL";
3219 if (log_msg != NULL)
3220 blackhole_log_msg = string_sprintf(": %s", log_msg);
3221 }
3222 else if (rc != OK)
3223 {
3224 Uunlink(spool_name);
3225 #ifdef WITH_CONTENT_SCAN
3226 unspool_mbox();
3227 #endif
3228 #ifdef EXPERIMENTAL_DCC
3229 dcc_ok = 0;
3230 #endif
3231 /* The ACL can specify where rejections are to be logged, possibly
3232 nowhere. The default is main and reject logs. */
3233
3234 if (log_reject_target != 0)
3235 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3236 sender_address, log_msg);
3237
3238 if (user_msg == NULL) user_msg = US"local configuration problem";
3239 if (smtp_batched_input)
3240 {
3241 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3242 /* Does not return */
3243 }
3244 else
3245 {
3246 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3247 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3248 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3249 header_list);
3250 /* Does not return */
3251 }
3252 }
3253 add_acl_headers(US"non-SMTP");
3254 }
3255 }
3256
3257 /* The applicable ACLs have been run */
3258
3259 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3260 if (queue_only_policy) queued_by = US"ACL";
3261 }
3262
3263 #ifdef WITH_CONTENT_SCAN
3264 unspool_mbox();
3265 #endif
3266
3267 #ifdef EXPERIMENTAL_DCC
3268 dcc_ok = 0;
3269 #endif
3270
3271
3272 /* The final check on the message is to run the scan_local() function. The
3273 version supplied with Exim always accepts, but this is a hook for sysadmins to
3274 supply their own checking code. The local_scan() function is run even when all
3275 the recipients have been discarded. */
3276
3277 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3278
3279 /* Arrange to catch crashes in local_scan(), so that the -D file gets
3280 deleted, and the incident gets logged. */
3281
3282 os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3283 os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3284 os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3285 os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3286
3287 DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3288 local_scan_timeout);
3289 local_scan_data = NULL;
3290
3291 os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3292 if (local_scan_timeout > 0) alarm(local_scan_timeout);
3293 rc = local_scan(data_fd, &local_scan_data);
3294 alarm(0);
3295 os_non_restarting_signal(SIGALRM, sigalrm_handler);
3296
3297 enable_dollar_recipients = FALSE;
3298
3299 store_pool = POOL_MAIN; /* In case changed */
3300 DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3301 local_scan_data);
3302
3303 os_non_restarting_signal(SIGSEGV, SIG_DFL);
3304 os_non_restarting_signal(SIGFPE, SIG_DFL);
3305 os_non_restarting_signal(SIGILL, SIG_DFL);
3306 os_non_restarting_signal(SIGBUS, SIG_DFL);
3307
3308 /* The length check is paranoia against some runaway code, and also because
3309 (for a success return) lines in the spool file are read into big_buffer. */
3310
3311 if (local_scan_data != NULL)
3312 {
3313 int len = Ustrlen(local_scan_data);
3314 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3315 local_scan_data = string_copyn(local_scan_data, len);
3316 }
3317
3318 if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3319 {
3320 if (!deliver_freeze) /* ACL might have already frozen */
3321 {
3322 deliver_freeze = TRUE;
3323 deliver_frozen_at = time(NULL);
3324 frozen_by = US"local_scan()";
3325 }
3326 rc = LOCAL_SCAN_ACCEPT;
3327 }
3328 else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3329 {
3330 if (!queue_only_policy) /* ACL might have already queued */
3331 {
3332 queue_only_policy = TRUE;
3333 queued_by = US"local_scan()";
3334 }
3335 rc = LOCAL_SCAN_ACCEPT;
3336 }
3337
3338 /* Message accepted: remove newlines in local_scan_data because otherwise
3339 the spool file gets corrupted. Ensure that all recipients are qualified. */
3340
3341 if (rc == LOCAL_SCAN_ACCEPT)
3342 {
3343 if (local_scan_data != NULL)
3344 {
3345 uschar *s;
3346 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3347 }
3348 for (i = 0; i < recipients_count; i++)
3349 {
3350 recipient_item *r = recipients_list + i;
3351 r->address = rewrite_address_qualify(r->address, TRUE);
3352 if (r->errors_to != NULL)
3353 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3354 }
3355 if (recipients_count == 0 && blackholed_by == NULL)
3356 blackholed_by = US"local_scan";
3357 }
3358
3359 /* Message rejected: newlines permitted in local_scan_data to generate
3360 multiline SMTP responses. */
3361
3362 else
3363 {
3364 uschar *istemp = US"";
3365 uschar *s = NULL;
3366 uschar *smtp_code;
3367 int size = 0;
3368 int sptr = 0;
3369
3370 errmsg = local_scan_data;
3371
3372 Uunlink(spool_name); /* Cancel this message */
3373 switch(rc)
3374 {
3375 default:
3376 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3377 "rejection given", rc);
3378 goto TEMPREJECT;
3379
3380 case LOCAL_SCAN_REJECT_NOLOGHDR:
3381 log_extra_selector &= ~LX_rejected_header;
3382 /* Fall through */
3383
3384 case LOCAL_SCAN_REJECT:
3385 smtp_code = US"550";
3386 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3387 break;
3388
3389 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
3390 log_extra_selector &= ~LX_rejected_header;
3391 /* Fall through */
3392
3393 case LOCAL_SCAN_TEMPREJECT:
3394 TEMPREJECT:
3395 smtp_code = US"451";
3396 if (errmsg == NULL) errmsg = US"Temporary local problem";
3397 istemp = US"temporarily ";
3398 break;
3399 }
3400
3401 s = string_append(s, &size, &sptr, 2, US"F=",
3402 (sender_address[0] == 0)? US"<>" : sender_address);
3403 s = add_host_info_for_log(s, &size, &sptr);
3404 s[sptr] = 0;
3405
3406 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3407 s, istemp, string_printing(errmsg));
3408
3409 if (smtp_input)
3410 {
3411 if (!smtp_batched_input)
3412 {
3413 smtp_respond(smtp_code, 3, TRUE, errmsg);
3414 message_id[0] = 0; /* Indicate no message accepted */
3415 smtp_reply = US""; /* Indicate reply already sent */
3416 goto TIDYUP; /* Skip to end of function */
3417 }
3418 else
3419 {
3420 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
3421 /* Does not return */
3422 }
3423 }
3424 else
3425 {
3426 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3427 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3428 US"message rejected by local scan code: ", error_rc, data_file,
3429 header_list);
3430 /* Does not return */
3431 }
3432 }
3433
3434 /* Reset signal handlers to ignore signals that previously would have caused
3435 the message to be abandoned. */
3436
3437 signal(SIGTERM, SIG_IGN);
3438 signal(SIGINT, SIG_IGN);
3439
3440
3441 /* Ensure the first time flag is set in the newly-received message. */
3442
3443 deliver_firsttime = TRUE;
3444
3445 #ifdef EXPERIMENTAL_BRIGHTMAIL
3446 if (bmi_run == 1) {
3447 /* rewind data file */
3448 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3449 bmi_verdicts = bmi_process_message(header_list, data_fd);
3450 };
3451 #endif
3452
3453 /* Update the timstamp in our Received: header to account for any time taken by
3454 an ACL or by local_scan(). The new time is the time that all reception
3455 processing is complete. */
3456
3457 timestamp = expand_string(US"${tod_full}");
3458 tslen = Ustrlen(timestamp);
3459
3460 memcpy(received_header->text + received_header->slen - tslen - 1,
3461 timestamp, tslen);
3462
3463 /* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3464
3465 if (mua_wrapper)
3466 {
3467 deliver_freeze = FALSE;
3468 queue_only_policy = FALSE;
3469 }
3470
3471 /* Keep the data file open until we have written the header file, in order to
3472 hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3473 don't write the header file, and we unlink the data file. If writing the header
3474 file fails, we have failed to accept this message. */
3475
3476 if (host_checking || blackholed_by != NULL)
3477 {
3478 header_line *h;
3479 Uunlink(spool_name);
3480 msg_size = 0; /* Compute size for log line */
3481 for (h = header_list; h != NULL; h = h->next)
3482 if (h->type != '*') msg_size += h->slen;
3483 }
3484
3485 /* Write the -H file */
3486
3487 else
3488 {
3489 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3490 {
3491 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3492 Uunlink(spool_name); /* Lose the data file */
3493
3494 if (smtp_input)
3495 {
3496 smtp_reply = US"451 Error in writing spool file";
3497 message_id[0] = 0; /* Indicate no message accepted */
3498 goto TIDYUP;
3499 }
3500 else
3501 {
3502 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3503 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3504 header_list);
3505 /* Does not return */
3506 }
3507 }
3508 }
3509
3510
3511 /* The message has now been successfully received. */
3512
3513 receive_messagecount++;
3514
3515 /* In SMTP sessions we may receive several in one connection. After each one,
3516 we wait for the clock to tick at the level of message-id granularity. This is
3517 so that the combination of time+pid is unique, even on systems where the pid
3518 can be re-used within our time interval. We can't shorten the interval without
3519 re-designing the message-id. See comments above where the message id is
3520 created. This is Something For The Future. */
3521
3522 message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3523 exim_wait_tick(&message_id_tv, id_resolution);
3524
3525 /* Add data size to written header size. We do not count the initial file name
3526 that is in the file, but we do add one extra for the notional blank line that
3527 precedes the data. This total differs from message_size in that it include the
3528 added Received: header and any other headers that got created locally. */
3529
3530 fflush(data_file);
3531 fstat(data_fd, &statbuf);
3532
3533 msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3534
3535 /* Generate a "message received" log entry. We do this by building up a dynamic
3536 string as required. Since we commonly want to add two items at a time, use a
3537 macro to simplify the coding. We log the arrival of a new message while the
3538 file is still locked, just in case the machine is *really* fast, and delivers
3539 it first! Include any message id that is in the message - since the syntax of a
3540 message id is actually an addr-spec, we can use the parse routine to canonicize
3541 it. */
3542
3543 size = 256;
3544 sptr = 0;
3545 s = store_get(size);
3546
3547 s = string_append(s, &size, &sptr, 2, US"<= ",
3548 (sender_address[0] == 0)? US"<>" : sender_address);
3549 if (message_reference != NULL)
3550 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3551
3552 s = add_host_info_for_log(s, &size, &sptr);
3553
3554 #ifdef SUPPORT_TLS
3555 if ((log_extra_selector & LX_tls_cipher) != 0 && tls_in.cipher != NULL)
3556 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
3557 if ((log_extra_selector & LX_tls_certificate_verified) != 0 &&
3558 tls_in.cipher != NULL)
3559 s = string_append(s, &size, &sptr, 2, US" CV=",
3560 tls_in.certificate_verified? "yes":"no");
3561 if ((log_extra_selector & LX_tls_peerdn) != 0 && tls_in.peerdn != NULL)
3562 s = string_append(s, &size, &sptr, 3, US" DN=\"",
3563 string_printing(tls_in.peerdn), US"\"");
3564 if ((log_extra_selector & LX_tls_sni) != 0 && tls_in.sni != NULL)
3565 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
3566 string_printing(tls_in.sni), US"\"");
3567 #endif
3568
3569 if (sender_host_authenticated != NULL)
3570 {
3571 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
3572 if (authenticated_id != NULL)
3573 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
3574 }
3575
3576 sprintf(CS big_buffer, "%d", msg_size);
3577 s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3578
3579 /* If an addr-spec in a message-id contains a quoted string, it can contain
3580 any characters except " \ and CR and so in particular it can contain NL!
3581 Therefore, make sure we use a printing-characters only version for the log.
3582 Also, allow for domain literals in the message id. */
3583
3584 if (msgid_header != NULL)
3585 {
3586 uschar *old_id;
3587 BOOL save_allow_domain_literals = allow_domain_literals;
3588 allow_domain_literals = TRUE;
3589 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3590 &errmsg, &start, &end, &domain, FALSE);
3591 allow_domain_literals = save_allow_domain_literals;
3592 if (old_id != NULL)
3593 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3594 }
3595
3596 /* If subject logging is turned on, create suitable printing-character
3597 text. By expanding $h_subject: we make use of the MIME decoding. */
3598
3599 if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL)
3600 {
3601 int i;
3602 uschar *p = big_buffer;
3603 uschar *ss = expand_string(US"$h_subject:");
3604
3605 /* Backslash-quote any double quotes or backslashes so as to make a
3606 a C-like string, and turn any non-printers into escape sequences. */
3607
3608 *p++ = '\"';
3609 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3610 {
3611 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3612 *p++ = ss[i];
3613 }
3614 *p++ = '\"';
3615 *p = 0;
3616 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3617 }
3618
3619 /* Terminate the string: string_cat() and string_append() leave room, but do
3620 not put the zero in. */
3621
3622 s[sptr] = 0;
3623
3624 /* Create a message log file if message logs are being used and this message is
3625 not blackholed. Write the reception stuff to it. We used to leave message log
3626 creation until the first delivery, but this has proved confusing for some
3627 people. */
3628
3629 if (message_logs && blackholed_by == NULL)
3630 {
3631 int fd;
3632
3633 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir,
3634 message_id);
3635 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3636
3637 if (fd < 0 && errno == ENOENT)
3638 {
3639 uschar temp[16];
3640 sprintf(CS temp, "msglog/%s", message_subdir);
3641 if (message_subdir[0] == 0) temp[6] = 0;
3642 (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE);
3643 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3644 }
3645
3646 if (fd < 0)
3647 {
3648 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3649 spool_name, strerror(errno));
3650 }
3651
3652 else
3653 {
3654 FILE *message_log = fdopen(fd, "a");
3655 if (message_log == NULL)
3656 {
3657 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3658 spool_name, strerror(errno));
3659 (void)close(fd);
3660 }
3661 else
3662 {
3663 uschar *now = tod_stamp(tod_log);
3664 fprintf(message_log, "%s Received from %s\n", now, s+3);
3665 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3666 frozen_by);
3667 if (queue_only_policy) fprintf(message_log,
3668 "%s no immediate delivery: queued by %s\n", now, queued_by);
3669 (void)fclose(message_log);
3670 }
3671 }
3672 }
3673
3674 /* Everything has now been done for a successful message except logging its
3675 arrival, and outputting an SMTP response. While writing to the log, set a flag
3676 to cause a call to receive_bomb_out() if the log cannot be opened. */
3677
3678 receive_call_bombout = TRUE;
3679
3680 /* Before sending an SMTP response in a TCP/IP session, we check to see if the
3681 connection has gone away. This can only be done if there is no unconsumed input
3682 waiting in the local input buffer. We can test for this by calling
3683 receive_smtp_buffered(). RFC 2920 (pipelining) explicitly allows for additional
3684 input to be sent following the final dot, so the presence of following input is
3685 not an error.
3686
3687 If the connection is still present, but there is no unread input for the
3688 socket, the result of a select() call will be zero. If, however, the connection
3689 has gone away, or if there is pending input, the result of select() will be
3690 non-zero. The two cases can be distinguished by trying to read the next input
3691 character. If we succeed, we can unread it so that it remains in the local
3692 buffer for handling later. If not, the connection has been lost.
3693
3694 Of course, since TCP/IP is asynchronous, there is always a chance that the
3695 connection will vanish between the time of this test and the sending of the
3696 response, but the chance of this happening should be small. */
3697
3698 if (smtp_input && sender_host_address != NULL && !sender_host_notsocket &&
3699 !receive_smtp_buffered())
3700 {
3701 struct timeval tv;
3702 fd_set select_check;
3703 FD_ZERO(&select_check);
3704 FD_SET(fileno(smtp_in), &select_check);
3705 tv.tv_sec = 0;
3706 tv.tv_usec = 0;
3707
3708 if (select(fileno(smtp_in) + 1, &select_check, NULL, NULL, &tv) != 0)
3709 {
3710 int c = (receive_getc)();
3711 if (c != EOF) (receive_ungetc)(c); else
3712 {
3713 uschar *msg = US"SMTP connection lost after final dot";
3714 smtp_reply = US""; /* No attempt to send a response */
3715 smtp_yield = FALSE; /* Nothing more on this connection */
3716
3717 /* Re-use the log line workspace */
3718
3719 sptr = 0;
3720 s = string_cat(s, &size, &sptr, msg, Ustrlen(msg));
3721 s = add_host_info_for_log(s, &size, &sptr);
3722 s[sptr] = 0;
3723 log_write(0, LOG_MAIN, "%s", s);
3724
3725 /* Delete the files for this aborted message. */
3726
3727 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
3728 message_subdir, message_id);
3729 Uunlink(spool_name);
3730
3731 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
3732 message_subdir, message_id);
3733 Uunlink(spool_name);
3734
3735 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
3736 message_subdir, message_id);
3737 Uunlink(spool_name);
3738
3739 goto TIDYUP;
3740 }
3741 }
3742 }
3743
3744 /* The connection has not gone away; we really are going to take responsibility
3745 for this message. */
3746
3747 /* Cutthrough - had sender last-dot; assume we've sent (or bufferred) all
3748 data onward by now.
3749
3750 Send dot onward. If accepted, wipe the spooled files, log as delivered and accept
3751 the sender's dot (below).
3752 If rejected: copy response to sender, wipe the spooled files, log approriately.
3753 If temp-reject: accept to sender, keep the spooled files.
3754
3755 Having the normal spool files lets us do data-filtering, and store/forward on temp-reject.
3756
3757 XXX We do not handle queue-only, freezing, or blackholes.
3758 */
3759 if(cutthrough_fd >= 0)
3760 {
3761 uschar * msg= cutthrough_finaldot(); /* Ask the target system to accept the messsage */
3762 /* Logging was done in finaldot() */
3763 switch(msg[0])
3764 {
3765 case '2': /* Accept. Do the same to the source; dump any spoolfiles. */
3766 cutthrough_done = 3;
3767 break; /* message_id needed for SMTP accept below */
3768
3769 default: /* Unknown response, or error. Treat as temp-reject. */
3770 case '4': /* Temp-reject. Keep spoolfiles and accept. */
3771 cutthrough_done = 1; /* Avoid the usual immediate delivery attempt */
3772 break; /* message_id needed for SMTP accept below */
3773
3774 case '5': /* Perm-reject. Do the same to the source. Dump any spoolfiles */
3775 smtp_reply= msg; /* Pass on the exact error */
3776 cutthrough_done = 2;
3777 break;
3778 }
3779 }
3780 else
3781 cutthrough_done = 0;
3782
3783 if(smtp_reply == NULL)
3784 {
3785 log_write(0, LOG_MAIN |
3786 (((log_extra_selector & LX_received_recipients) != 0)? LOG_RECIPIENTS : 0) |
3787 (((log_extra_selector & LX_received_sender) != 0)? LOG_SENDER : 0),
3788 "%s", s);
3789
3790 /* Log any control actions taken by an ACL or local_scan(). */
3791
3792 if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
3793 if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
3794 "no immediate delivery: queued by %s", queued_by);
3795 }
3796 receive_call_bombout = FALSE;
3797
3798 store_reset(s); /* The store for the main log message can be reused */
3799
3800 /* If the message is frozen, and freeze_tell is set, do the telling. */
3801
3802 if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
3803 {
3804 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
3805 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
3806 message_id, frozen_by, sender_address);
3807 }
3808
3809
3810 /* Either a message has been successfully received and written to the two spool
3811 files, or an error in writing the spool has occurred for an SMTP message, or
3812 an SMTP message has been rejected for policy reasons. (For a non-SMTP message
3813 we will have already given up because there's no point in carrying on!) In
3814 either event, we must now close (and thereby unlock) the data file. In the
3815 successful case, this leaves the message on the spool, ready for delivery. In
3816 the error case, the spool file will be deleted. Then tidy up store, interact
3817 with an SMTP call if necessary, and return.
3818
3819 A fflush() was done earlier in the expectation that any write errors on the
3820 data file will be flushed(!) out thereby. Nevertheless, it is theoretically
3821 possible for fclose() to fail - but what to do? What has happened to the lock
3822 if this happens? */
3823
3824
3825 TIDYUP:
3826 process_info[process_info_len] = 0; /* Remove message id */
3827 if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
3828
3829 /* Now reset signal handlers to their defaults */
3830
3831 signal(SIGTERM, SIG_DFL);
3832 signal(SIGINT, SIG_DFL);
3833
3834 /* Tell an SMTP caller the state of play, and arrange to return the SMTP return
3835 value, which defaults TRUE - meaning there may be more incoming messages from
3836 this connection. For non-SMTP callers (where there is only ever one message),
3837 the default is FALSE. */
3838
3839 if (smtp_input)
3840 {
3841 yield = smtp_yield;
3842
3843 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
3844 is set to the response that should be sent. When it is NULL, we generate
3845 default responses. After an ACL error or local_scan() error, the response has
3846 already been sent, and smtp_reply is an empty string to indicate this. */
3847
3848 if (!smtp_batched_input)
3849 {
3850 if (smtp_reply == NULL)
3851 {
3852 if (fake_response != OK)
3853 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
3854 fake_response_text);
3855
3856 /* An OK response is required; use "message" text if present. */
3857
3858 else if (user_msg != NULL)
3859 {
3860 uschar *code = US"250";
3861 int len = 3;
3862 smtp_message_code(&code, &len, &user_msg, NULL);
3863 smtp_respond(code, len, TRUE, user_msg);
3864 }
3865
3866 /* Default OK response */
3867
3868 else
3869 smtp_printf("250 OK id=%s\r\n", message_id);
3870 if (host_checking)
3871 fprintf(stdout,
3872 "\n**** SMTP testing: that is not a real message id!\n\n");
3873 }
3874
3875 /* smtp_reply is set non-empty */
3876
3877 else if (smtp_reply[0] != 0)
3878 {
3879 if (fake_response != OK && (smtp_reply[0] == '2'))
3880 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
3881 fake_response_text);
3882 else
3883 smtp_printf("%.1024s\r\n", smtp_reply);
3884 }
3885
3886 switch (cutthrough_done)
3887 {
3888 case 3: log_write(0, LOG_MAIN, "Completed"); /* Delivery was done */
3889 case 2: { /* Delete spool files */
3890 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
3891 message_subdir, message_id);
3892 Uunlink(spool_name);
3893 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
3894 message_subdir, message_id);
3895 Uunlink(spool_name);
3896 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
3897 message_subdir, message_id);
3898 Uunlink(spool_name);
3899 }
3900 case 1: message_id[0] = 0; /* Prevent a delivery from starting */
3901 default:break;
3902 }
3903 cutthrough_delivery = FALSE;
3904 }
3905
3906 /* For batched SMTP, generate an error message on failure, and do
3907 nothing on success. The function moan_smtp_batch() does not return -
3908 it exits from the program with a non-zero return code. */
3909
3910 else if (smtp_reply != NULL) moan_smtp_batch(NULL, "%s", smtp_reply);
3911 }
3912
3913
3914 /* If blackholing, we can immediately log this message's sad fate. The data
3915 file has already been unlinked, and the header file was never written to disk.
3916 We must now indicate that nothing was received, to prevent a delivery from
3917 starting. */
3918
3919 if (blackholed_by != NULL)
3920 {
3921 uschar *detail = (local_scan_data != NULL)?
3922 string_printing(local_scan_data) :
3923 string_sprintf("(%s discarded recipients)", blackholed_by);
3924 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
3925 log_write(0, LOG_MAIN, "Completed");
3926 message_id[0] = 0;
3927 }
3928
3929 /* Reset headers so that logging of rejects for a subsequent message doesn't
3930 include them. It is also important to set header_last = NULL before exiting
3931 from this function, as this prevents certain rewrites that might happen during
3932 subsequent verifying (of another incoming message) from trying to add headers
3933 when they shouldn't. */
3934
3935 header_list = header_last = NULL;
3936
3937 return yield; /* TRUE if more messages (SMTP only) */
3938 }
3939
3940 /* End of receive.c */