Remove obsolete commented-out code from receive.c.
[exim.git] / src / src / receive.c
CommitLineData
2cbb4081 1/* $Cambridge: exim/src/src/receive.c,v 1.26 2006/02/14 15:11:43 ph10 Exp $ */
059ec3d9
PH
2
3/*************************************************
4* Exim - an Internet mail transport agent *
5*************************************************/
6
d7d7b7b9 7/* Copyright (c) University of Cambridge 1995 - 2006 */
059ec3d9
PH
8/* See the file NOTICE for conditions of use and distribution. */
9
10/* Code for receiving a message and setting up spool files. */
11
059ec3d9
PH
12#include "exim.h"
13
fb2274d4
TK
14#ifdef EXPERIMENTAL_DOMAINKEYS
15#define RECEIVE_GETC dk_receive_getc
16#define RECEIVE_UNGETC dk_receive_ungetc
17#else
18#define RECEIVE_GETC receive_getc
19#define RECEIVE_UNGETC receive_ungetc
20#endif
059ec3d9
PH
21
22/*************************************************
23* Local static variables *
24*************************************************/
25
26static FILE *data_file = NULL;
27static int data_fd = -1;
28static uschar spool_name[256];
29
30
31
32/*************************************************
33* Non-SMTP character reading functions *
34*************************************************/
35
36/* These are the default functions that are set up in the variables such as
37receive_getc initially. They just call the standard functions, passing stdin as
38the file. (When SMTP input is occurring, different functions are used by
39changing the pointer variables.) */
40
41int
42stdin_getc(void)
43{
44return getc(stdin);
45}
46
47int
48stdin_ungetc(int c)
49{
50return ungetc(c, stdin);
51}
52
53int
54stdin_feof(void)
55{
56return feof(stdin);
57}
58
59int
60stdin_ferror(void)
61{
62return ferror(stdin);
63}
64
65
66
67
68/*************************************************
69* Check that a set sender is allowed *
70*************************************************/
71
72/* This function is called when a local caller sets an explicit sender address.
73It checks whether this is permitted, which it is for trusted callers.
74Otherwise, it must match the pattern(s) in untrusted_set_sender.
75
76Arguments: the proposed sender address
77Returns: TRUE for a trusted caller
78 TRUE if the address has been set, untrusted_set_sender has been
79 set, and the address matches something in the list
80 FALSE otherwise
81*/
82
83BOOL
84receive_check_set_sender(uschar *newsender)
85{
86uschar *qnewsender;
87if (trusted_caller) return TRUE;
88if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
89qnewsender = (Ustrchr(newsender, '@') != NULL)?
90 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
91return
92 match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1,
93 0, NULL) == OK;
94}
95
96
97
98
99/*************************************************
5cb8cbc6 100* Read space info for a partition *
059ec3d9
PH
101*************************************************/
102
8e669ac1
PH
103/* This function is called by receive_check_fs() below, and also by string
104expansion for variables such as $spool_space. The field names for the statvfs
5cb8cbc6
PH
105structure are macros, because not all OS have F_FAVAIL and it seems tidier to
106have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
107have inodes, and they return -1 for the number available.
059ec3d9 108
5cb8cbc6
PH
109Later: It turns out that some file systems that do not have the concept of
110inodes return 0 rather than -1. Such systems should also return 0 for the total
8e669ac1 111number of inodes, so we require that to be greater than zero before returning
5cb8cbc6 112an inode count.
059ec3d9 113
5cb8cbc6
PH
114Arguments:
115 isspool TRUE for spool partition, FALSE for log partition
116 inodeptr address of int to receive inode count; -1 if there isn't one
8e669ac1 117
5cb8cbc6 118Returns: available on-root space, in kilobytes
8e669ac1
PH
119 -1 for log partition if there isn't one
120
121All values are -1 if the STATFS functions are not available.
059ec3d9
PH
122*/
123
8e669ac1 124int
5cb8cbc6 125receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
126{
127#ifdef HAVE_STATFS
059ec3d9 128struct STATVFS statbuf;
5cb8cbc6
PH
129uschar *path;
130uschar *name;
131uschar buffer[1024];
059ec3d9 132
5cb8cbc6 133/* The spool directory must always exist. */
059ec3d9 134
5cb8cbc6 135if (isspool)
059ec3d9 136 {
8e669ac1
PH
137 path = spool_directory;
138 name = US"spool";
139 }
140
059ec3d9
PH
141/* Need to cut down the log file path to the directory, and to ignore any
142appearance of "syslog" in it. */
143
5cb8cbc6 144else
059ec3d9 145 {
059ec3d9 146 int sep = ':'; /* Not variable - outside scripts use */
059ec3d9 147 uschar *p = log_file_path;
8e669ac1 148 name = US"log";
059ec3d9
PH
149
150 /* An empty log_file_path means "use the default". This is the same as an
151 empty item in a list. */
152
153 if (*p == 0) p = US":";
154 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL)
155 {
156 if (Ustrcmp(path, "syslog") != 0) break;
157 }
158
5cb8cbc6
PH
159 if (path == NULL) /* No log files */
160 {
8e669ac1
PH
161 *inodeptr = -1;
162 return -1;
163 }
059ec3d9 164
8e669ac1
PH
165 /* An empty string means use the default, which is in the spool directory.
166 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 167 subdirectory has been symbolically linked elsewhere. */
059ec3d9 168
8e669ac1 169 if (path[0] == 0)
059ec3d9 170 {
5cb8cbc6
PH
171 sprintf(CS buffer, CS"%s/log", CS spool_directory);
172 path = buffer;
8e669ac1
PH
173 }
174 else
059ec3d9 175 {
8e669ac1 176 uschar *cp;
5cb8cbc6 177 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 178 }
5cb8cbc6 179 }
8e669ac1 180
5cb8cbc6
PH
181/* We now have the patch; do the business */
182
183memset(&statbuf, 0, sizeof(statbuf));
184
185if (STATVFS(CS path, &statbuf) != 0)
186 {
187 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
188 "%s directory %s: %s", name, spool_directory, strerror(errno));
189 smtp_closedown(US"spool or log directory problem");
190 exim_exit(EXIT_FAILURE);
191 }
8e669ac1 192
5cb8cbc6
PH
193*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
194
195/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 196
5cb8cbc6
PH
197return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
198
199/* Unable to find partition sizes in this environment. */
200
201#else
202*inodeptr = -1;
203return -1;
204#endif
205}
206
059ec3d9 207
059ec3d9 208
5cb8cbc6
PH
209
210/*************************************************
211* Check space on spool and log partitions *
212*************************************************/
213
214/* This function is called before accepting a message; if any thresholds are
215set, it checks them. If a message_size is supplied, it checks that there is
216enough space for that size plus the threshold - i.e. that the message won't
217reduce the space to the threshold. Not all OS have statvfs(); for those that
218don't, this function always returns TRUE. For some OS the old function and
219struct name statfs is used; that is handled by a macro, defined in exim.h.
220
221Arguments:
222 msg_size the (estimated) size of an incoming message
223
224Returns: FALSE if there isn't enough space, or if the information cannot
225 be obtained
226 TRUE if no check was done or there is enough space
227*/
228
229BOOL
230receive_check_fs(int msg_size)
231{
232int space, inodes;
233
234if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
235 {
8e669ac1
PH
236 space = receive_statvfs(TRUE, &inodes);
237
059ec3d9 238 DEBUG(D_receive)
5cb8cbc6
PH
239 debug_printf("spool directory space = %dK inodes = %d "
240 "check_space = %dK inodes = %d msg_size = %d\n",
241 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
242
243 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 244 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 245 {
5cb8cbc6
PH
246 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
247 "inodes=%d", space, inodes);
059ec3d9
PH
248 return FALSE;
249 }
250 }
251
5cb8cbc6
PH
252if (check_log_space > 0 || check_log_inodes > 0)
253 {
8e669ac1
PH
254 space = receive_statvfs(FALSE, &inodes);
255
5cb8cbc6
PH
256 DEBUG(D_receive)
257 debug_printf("log directory space = %dK inodes = %d "
258 "check_space = %dK inodes = %d\n",
259 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
260
261 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 262 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 263 {
5cb8cbc6
PH
264 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
265 "inodes=%d", space, inodes);
266 return FALSE;
267 }
8e669ac1
PH
268 }
269
059ec3d9
PH
270return TRUE;
271}
272
273
274
275/*************************************************
276* Bomb out while reading a message *
277*************************************************/
278
279/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
280received, or if there is a timeout. A rarer case might be if the log files are
281screwed up and Exim can't open them to record a message's arrival. Handling
282that case is done by setting a flag to cause the log functions to call this
283function if there is an ultimate disaster. That is why it is globally
284accessible.
285
286Arguments: SMTP response to give if in an SMTP session
287Returns: it doesn't
288*/
289
290void
291receive_bomb_out(uschar *msg)
292{
293/* If spool_name is set, it contains the name of the data file that is being
294written. Unlink it before closing so that it cannot be picked up by a delivery
295process. Ensure that any header file is also removed. */
296
297if (spool_name[0] != 0)
298 {
299 Uunlink(spool_name);
300 spool_name[Ustrlen(spool_name) - 1] = 'H';
301 Uunlink(spool_name);
302 }
303
304/* Now close the file if it is open, either as a fd or a stream. */
305
f1e894f3
PH
306if (data_file != NULL) (void)fclose(data_file);
307 else if (data_fd >= 0) (void)close(data_fd);
059ec3d9
PH
308
309/* Attempt to close down an SMTP connection tidily. */
310
311if (smtp_input)
312 {
313 if (!smtp_batched_input)
314 {
315 smtp_printf("421 %s %s - closing connection.\r\n", smtp_active_hostname,
316 msg);
317 mac_smtp_fflush();
318 }
319
320 /* Control does not return from moan_smtp_batch(). */
321
322 else moan_smtp_batch(NULL, "421 %s - message abandoned", msg);
323 }
324
325/* Exit from the program (non-BSMTP cases) */
326
327exim_exit(EXIT_FAILURE);
328}
329
330
331/*************************************************
332* Data read timeout *
333*************************************************/
334
335/* Handler function for timeouts that occur while reading the data that
336comprises a message.
337
338Argument: the signal number
339Returns: nothing
340*/
341
342static void
343data_timeout_handler(int sig)
344{
345uschar *msg = NULL;
346
347sig = sig; /* Keep picky compilers happy */
348
349if (smtp_input)
350 {
351 msg = US"SMTP incoming data timeout";
352 log_write(L_lost_incoming_connection,
353 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
354 "from %s F=<%s>",
355 (sender_fullhost != NULL)? sender_fullhost : US"local process",
356 sender_address);
059ec3d9
PH
357 }
358else
359 {
360 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
361 log_write(L_lost_incoming_connection,
362 LOG_MAIN, "timed out while reading local message");
363 }
364
365receive_bomb_out(msg); /* Does not return */
366}
367
368
369
370/*************************************************
371* local_scan() timeout *
372*************************************************/
373
374/* Handler function for timeouts that occur while running a local_scan()
375function.
376
377Argument: the signal number
378Returns: nothing
379*/
380
381static void
382local_scan_timeout_handler(int sig)
383{
384sig = sig; /* Keep picky compilers happy */
385log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
386 "message temporarily rejected (size %d)", message_size);
387receive_bomb_out(US"local verification problem"); /* Does not return */
388}
389
390
391
392/*************************************************
393* local_scan() crashed *
394*************************************************/
395
396/* Handler function for signals that occur while running a local_scan()
397function.
398
399Argument: the signal number
400Returns: nothing
401*/
402
403static void
404local_scan_crash_handler(int sig)
405{
406log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
407 "signal %d - message temporarily rejected (size %d)", sig, message_size);
408receive_bomb_out(US"local verification problem"); /* Does not return */
409}
410
411
412/*************************************************
413* SIGTERM or SIGINT received *
414*************************************************/
415
416/* Handler for SIGTERM or SIGINT signals that occur while reading the
417data that comprises a message.
418
419Argument: the signal number
420Returns: nothing
421*/
422
423static void
424data_sigterm_sigint_handler(int sig)
425{
426uschar *msg = NULL;
427
428if (smtp_input)
429 {
430 msg = US"Service not available - SIGTERM or SIGINT received";
431 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
432 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
433 }
434else
435 {
f05da2e8 436 if (filter_test == FTEST_NONE)
059ec3d9
PH
437 {
438 fprintf(stderr, "\nexim: %s received - message abandoned\n",
439 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
440 log_write(0, LOG_MAIN, "%s received while reading local message",
441 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
442 }
443 }
444
445receive_bomb_out(msg); /* Does not return */
446}
447
448
449
450/*************************************************
451* Add new recipient to list *
452*************************************************/
453
454/* This function builds a list of recipient addresses in argc/argv
455format.
456
457Arguments:
458 recipient the next address to add to recipients_list
459 pno parent number for fixed aliases; -1 otherwise
460
461Returns: nothing
462*/
463
464void
465receive_add_recipient(uschar *recipient, int pno)
466{
467if (recipients_count >= recipients_list_max)
468 {
469 recipient_item *oldlist = recipients_list;
470 int oldmax = recipients_list_max;
471 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
472 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
473 if (oldlist != NULL)
474 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
475 }
476
477recipients_list[recipients_count].address = recipient;
478recipients_list[recipients_count].pno = pno;
8523533c
TK
479#ifdef EXPERIMENTAL_BRIGHTMAIL
480recipients_list[recipients_count].bmi_optin = bmi_current_optin;
481/* reset optin string pointer for next recipient */
482bmi_current_optin = NULL;
483#endif
059ec3d9
PH
484recipients_list[recipients_count++].errors_to = NULL;
485}
486
487
488
489
490/*************************************************
491* Remove a recipient from the list *
492*************************************************/
493
494/* This function is provided for local_scan() to use.
495
496Argument:
497 recipient address to remove
498
499Returns: TRUE if it did remove something; FALSE otherwise
500*/
501
502BOOL
503receive_remove_recipient(uschar *recipient)
504{
505int count;
506DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
507 recipient);
508for (count = 0; count < recipients_count; count++)
509 {
510 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
511 {
512 if ((--recipients_count - count) > 0)
513 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 514 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
515 return TRUE;
516 }
517 }
518return FALSE;
519}
520
521
522
523
524
525/*************************************************
526* Read data portion of a non-SMTP message *
527*************************************************/
528
529/* This function is called to read the remainder of a message (following the
530header) when the input is not from SMTP - we are receiving a local message on
531a standard input stream. The message is always terminated by EOF, and is also
532terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
533two cases for maximum efficiency.
534
535Ensure that the body ends with a newline. This will naturally be the case when
536the termination is "\n.\n" but may not be otherwise. The RFC defines messages
537as "sequences of lines" - this of course strictly applies only to SMTP, but
538deliveries into BSD-type mailbox files also require it. Exim used to have a
539flag for doing this at delivery time, but as it was always set for all
540transports, I decided to simplify things by putting the check here instead.
541
542There is at least one MUA (dtmail) that sends CRLF via this interface, and
543other programs are known to do this as well. Exim used to have a option for
544dealing with this: in July 2003, after much discussion, the code has been
545changed to default to treat any of LF, CRLF, and bare CR as line terminators.
546
547However, for the case when a dot on a line by itself terminates a message, the
548only recognized terminating sequences before and after the dot are LF and CRLF.
549Otherwise, having read EOL . CR, you don't know whether to read another
550character or not.
551
552Internally, in messages stored in Exim's spool files, LF is used as the line
553terminator. Under the new regime, bare CRs will no longer appear in these
554files.
555
556Arguments:
557 fout a FILE to which to write the message
558
559Returns: One of the END_xxx values indicating why it stopped reading
560*/
561
562static int
563read_message_data(FILE *fout)
564{
565int ch_state;
566register int ch;
567
568/* Handle the case when only EOF terminates the message */
569
570if (!dot_ends)
571 {
572 register int last_ch = '\n';
573
fb2274d4 574 for (; (ch = (RECEIVE_GETC)()) != EOF; last_ch = ch)
059ec3d9
PH
575 {
576 if (ch == 0) body_zerocount++;
577 if (last_ch == '\r' && ch != '\n')
578 {
579 if (fputc('\n', fout) == EOF) return END_WERROR;
580 message_size++;
581 body_linecount++;
582 }
583 if (ch == '\r') continue;
584
585 if (fputc(ch, fout) == EOF) return END_WERROR;
586 if (ch == '\n') body_linecount++;
587 if (++message_size > thismessage_size_limit) return END_SIZE;
588 }
589
590 if (last_ch != '\n')
591 {
592 if (fputc('\n', fout) == EOF) return END_WERROR;
593 message_size++;
594 body_linecount++;
595 }
596
597 return END_EOF;
598 }
599
600/* Handle the case when a dot on a line on its own, or EOF, terminates. */
601
602ch_state = 1;
603
fb2274d4 604while ((ch = (RECEIVE_GETC)()) != EOF)
059ec3d9
PH
605 {
606 if (ch == 0) body_zerocount++;
607 switch (ch_state)
608 {
609 case 0: /* Normal state (previous char written) */
610 if (ch == '\n')
611 { body_linecount++; ch_state = 1; }
612 else if (ch == '\r')
613 { ch_state = 2; continue; }
614 break;
615
616 case 1: /* After written "\n" */
617 if (ch == '.') { ch_state = 3; continue; }
618 if (ch != '\n') ch_state = 0;
619 break;
620
621 case 2:
622 body_linecount++; /* After unwritten "\r" */
623 if (ch == '\n')
624 { ch_state = 1; }
625 else
626 {
627 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
628 if (ch == '\r') continue;
629 ch_state = 0;
630 }
631 break;
632
633 case 3: /* After "\n." (\n written, dot not) */
634 if (ch == '\n') return END_DOT;
635 if (ch == '\r') { ch_state = 4; continue; }
636 message_size++;
637 if (fputc('.', fout) == EOF) return END_WERROR;
638 ch_state = 0;
639 break;
640
641 case 4: /* After "\n.\r" (\n written, rest not) */
642 if (ch == '\n') return END_DOT;
643 message_size += 2;
644 body_linecount++;
645 if (fputs(".\n", fout) == EOF) return END_WERROR;
646 if (ch == '\r') { ch_state = 2; continue; }
647 ch_state = 0;
648 break;
649 }
650
651 if (fputc(ch, fout) == EOF) return END_WERROR;
652 if (++message_size > thismessage_size_limit) return END_SIZE;
653 }
654
655/* Get here if EOF read. Unless we have just written "\n", we need to ensure
656the message ends with a newline, and we must also write any characters that
657were saved up while testing for an ending dot. */
658
659if (ch_state != 1)
660 {
661 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
662 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
663 message_size += Ustrlen(ends[ch_state]);
664 body_linecount++;
665 }
666
667return END_EOF;
668}
669
670
671
672
673/*************************************************
674* Read data portion of an SMTP message *
675*************************************************/
676
677/* This function is called to read the remainder of an SMTP message (after the
678headers), or to skip over it when an error has occurred. In this case, the
679output file is passed as NULL.
680
681If any line begins with a dot, that character is skipped. The input should only
682be successfully terminated by CR LF . CR LF unless it is local (non-network)
683SMTP, in which case the CRs are optional, but...
684
685FUDGE: It seems that sites on the net send out messages with just LF
686terminators, despite the warnings in the RFCs, and other MTAs handle this. So
687we make the CRs optional in all cases.
688
689July 2003: Bare CRs cause trouble. We now treat them as line terminators as
690well, so that there are no CRs in spooled messages. However, the message
691terminating dot is not recognized between two bare CRs.
692
693Arguments:
694 fout a FILE to which to write the message; NULL if skipping
695
696Returns: One of the END_xxx values indicating why it stopped reading
697*/
698
699static int
700read_message_data_smtp(FILE *fout)
701{
702int ch_state = 0;
703register int ch;
704
fb2274d4 705while ((ch = (RECEIVE_GETC)()) != EOF)
059ec3d9
PH
706 {
707 if (ch == 0) body_zerocount++;
708 switch (ch_state)
709 {
710 case 0: /* After LF or CRLF */
711 if (ch == '.')
712 {
713 ch_state = 3;
714 continue; /* Don't ever write . after LF */
715 }
716 ch_state = 1;
717
718 /* Else fall through to handle as normal uschar. */
719
720 case 1: /* Normal state */
721 if (ch == '\n')
722 {
723 ch_state = 0;
724 body_linecount++;
725 }
726 else if (ch == '\r')
727 {
728 ch_state = 2;
729 continue;
730 }
731 break;
732
733 case 2: /* After (unwritten) CR */
734 body_linecount++;
735 if (ch == '\n')
736 {
737 ch_state = 0;
738 }
739 else
740 {
741 message_size++;
742 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
743 if (ch != '\r') ch_state = 1; else continue;
744 }
745 break;
746
747 case 3: /* After [CR] LF . */
748 if (ch == '\n')
749 return END_DOT;
750 if (ch == '\r')
751 {
752 ch_state = 4;
753 continue;
754 }
755 ch_state = 1; /* The dot itself is removed */
756 break;
757
758 case 4: /* After [CR] LF . CR */
759 if (ch == '\n') return END_DOT;
760 message_size++;
761 body_linecount++;
762 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
763 if (ch == '\r')
764 {
765 ch_state = 2;
766 continue;
767 }
768 ch_state = 1;
769 break;
770 }
771
772 /* Add the character to the spool file, unless skipping; then loop for the
773 next. */
774
775 message_size++;
776 if (fout != NULL)
777 {
778 if (fputc(ch, fout) == EOF) return END_WERROR;
779 if (message_size > thismessage_size_limit) return END_SIZE;
780 }
781 }
782
783/* Fall through here if EOF encountered. This indicates some kind of error,
784since a correct message is terminated by [CR] LF . [CR] LF. */
785
786return END_EOF;
787}
788
789
790
791
792/*************************************************
793* Swallow SMTP message *
794*************************************************/
795
796/* This function is called when there has been some kind of error while reading
797an SMTP message, and the remaining data may need to be swallowed. It is global
798because it is called from smtp_closedown() to shut down an incoming call
799tidily.
800
801Argument: a FILE from which to read the message
802Returns: nothing
803*/
804
805void
806receive_swallow_smtp(void)
807{
808if (message_ended >= END_NOTENDED)
809 message_ended = read_message_data_smtp(NULL);
810}
811
812
813
814/*************************************************
815* Handle lost SMTP connection *
816*************************************************/
817
818/* This function logs connection loss incidents and generates an appropriate
819SMTP response.
820
821Argument: additional data for the message
822Returns: the SMTP response
823*/
824
825static uschar *
826handle_lost_connection(uschar *s)
827{
828log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
829 "%s lost while reading message data%s", smtp_get_connection_info(), s);
830return US"421 Lost incoming connection";
831}
832
833
834
835
836/*************************************************
837* Handle a non-smtp reception error *
838*************************************************/
839
840/* This function is called for various errors during the reception of non-SMTP
841messages. It either sends a message to the sender of the problem message, or it
842writes to the standard error stream.
843
844Arguments:
845 errcode code for moan_to_sender(), identifying the error
846 text1 first message text, passed to moan_to_sender()
847 text2 second message text, used only for stderrr
848 error_rc code to pass to exim_exit if no problem
849 f FILE containing body of message (may be stdin)
850 hptr pointer to instore headers or NULL
851
852Returns: calls exim_exit(), which does not return
853*/
854
855static void
856give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
857 FILE *f, header_line *hptr)
858{
859if (error_handling == ERRORS_SENDER)
860 {
861 error_block eblock;
862 eblock.next = NULL;
863 eblock.text1 = text1;
864 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
865 error_rc = EXIT_FAILURE;
866 }
867else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 868(void)fclose(f);
059ec3d9
PH
869exim_exit(error_rc);
870}
871
872
873
874/*************************************************
875* Add header lines set up by ACL *
876*************************************************/
877
878/* This function is called to add the header lines that were set up by "warn"
879statements in an ACL onto the list of headers in memory. It is done in two
880stages like this, because when the ACL for RCPT is running, the other headers
881have not yet been received. This function is called twice; once just before
882running the DATA ACL, and once after. This is so that header lines added by
883MAIL or RCPT are visible to the DATA ACL.
884
885Originally these header lines were added at the end. Now there is support for
886three different places: top, bottom, and after the Received: header(s). There
887will always be at least one Received: header, even if it is marked deleted, and
888even if something else has been put in front of it.
889
890Arguments:
891 acl_name text to identify which ACL
892
893Returns: nothing
894*/
895
896static void
897add_acl_headers(uschar *acl_name)
898{
899header_line *h, *next;
900header_line *last_received = NULL;
901
902if (acl_warn_headers == NULL) return;
903DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
904
905for (h = acl_warn_headers; h != NULL; h = next)
906 {
907 next = h->next;
908
909 switch(h->type)
910 {
911 case htype_add_top:
912 h->next = header_list;
913 header_list = h;
914 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
915 break;
916
917 case htype_add_rec:
918 if (last_received == NULL)
919 {
920 last_received = header_list;
921 while (!header_testname(last_received, US"Received", 8, FALSE))
922 last_received = last_received->next;
923 while (last_received->next != NULL &&
924 header_testname(last_received->next, US"Received", 8, FALSE))
925 last_received = last_received->next;
926 }
927 h->next = last_received->next;
928 last_received->next = h;
929 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
930 break;
931
8523533c
TK
932 case htype_add_rfc:
933 /* add header before any header which is NOT Received: or Resent- */
934 last_received = header_list;
935 while ( (last_received->next != NULL) &&
936 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
937 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
938 last_received = last_received->next;
939 /* last_received now points to the last Received: or Resent-* header
940 in an uninterrupted chain of those header types (seen from the beginning
941 of all headers. Our current header must follow it. */
942 h->next = last_received->next;
943 last_received->next = h;
8e669ac1 944 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
945 break;
946
059ec3d9
PH
947 default:
948 h->next = NULL;
949 header_last->next = h;
950 break;
951 }
952
953 if (h->next == NULL) header_last = h;
954
955 /* Check for one of the known header types (From:, To:, etc.) though in
956 practice most added headers are going to be "other". Lower case
957 identification letters are never stored with the header; they are used
958 for existence tests when messages are received. So discard any lower case
959 flag values. */
960
961 h->type = header_checkname(h, FALSE);
962 if (h->type >= 'a') h->type = htype_other;
963
964 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
965 }
966
967acl_warn_headers = NULL;
968DEBUG(D_receive|D_acl) debug_printf(">>\n");
969}
970
971
972
973/*************************************************
974* Add host information for log line *
975*************************************************/
976
977/* Called for acceptance and rejecting log lines. This adds information about
978the calling host to a string that is being built dynamically.
979
980Arguments:
981 s the dynamic string
982 sizeptr points to the size variable
983 ptrptr points to the pointer variable
984
985Returns: the extended string
986*/
987
988static uschar *
989add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr)
990{
991if (sender_fullhost != NULL)
992 {
993 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
994 if ((log_extra_selector & LX_incoming_interface) != 0 &&
995 interface_address != NULL)
996 {
997 uschar *ss = string_sprintf(" I=[%s]:%d", interface_address,
998 interface_port);
999 s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss));
1000 }
1001 }
1002if (sender_ident != NULL)
1003 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1004if (received_protocol != NULL)
1005 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1006return s;
1007}
1008
1009
1010
63955bf2 1011#ifdef WITH_CONTENT_SCAN
059ec3d9
PH
1012
1013/*************************************************
54cdb463
PH
1014* Run the MIME ACL on a message *
1015*************************************************/
1016
1017/* This code is in a subroutine so that it can be used for both SMTP
1018and non-SMTP messages. It is called with a non-NULL ACL pointer.
1019
1020Arguments:
1021 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1022 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1023 smtp_reply_ptr Where SMTP reply is being built
1024 blackholed_by_ptr Where "blackholed by" message is being built
1025
1026Returns: TRUE to carry on; FALSE to abandon the message
1027*/
1028
1029static BOOL
1030run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1031 uschar **blackholed_by_ptr)
1032{
1033FILE *mbox_file;
1034uschar rfc822_file_path[2048];
1035unsigned long mbox_size;
1036header_line *my_headerlist;
1037uschar *user_msg, *log_msg;
1038int mime_part_count_buffer = -1;
1039int rc;
1040
1041memset(CS rfc822_file_path,0,2048);
1042
1043/* check if it is a MIME message */
1044my_headerlist = header_list;
1045while (my_headerlist != NULL) {
1046 /* skip deleted headers */
1047 if (my_headerlist->type == '*') {
1048 my_headerlist = my_headerlist->next;
1049 continue;
1050 };
1051 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0) {
1052 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1053 goto DO_MIME_ACL;
1054 };
1055 my_headerlist = my_headerlist->next;
1056};
1057
1058DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1059return TRUE;
1060
1061DO_MIME_ACL:
1062/* make sure the eml mbox file is spooled up */
1063mbox_file = spool_mbox(&mbox_size);
1064if (mbox_file == NULL) {
1065 /* error while spooling */
1066 log_write(0, LOG_MAIN|LOG_PANIC,
1067 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1068 Uunlink(spool_name);
1069 unspool_mbox();
1070 smtp_respond(451, TRUE, US"temporary local problem");
1071 message_id[0] = 0; /* Indicate no message accepted */
1072 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1073 return FALSE; /* Indicate skip to end of receive function */
1074};
1075
1076mime_is_rfc822 = 0;
1077
1078MIME_ACL_CHECK:
1079mime_part_count = -1;
1080rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1081(void)fclose(mbox_file);
54cdb463
PH
1082
1083if (Ustrlen(rfc822_file_path) > 0) {
1084 mime_part_count = mime_part_count_buffer;
1085
1086 if (unlink(CS rfc822_file_path) == -1) {
1087 log_write(0, LOG_PANIC,
1088 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1089 goto END_MIME_ACL;
1090 };
1091};
1092
1093/* check if we must check any message/rfc822 attachments */
1094if (rc == OK) {
1095 uschar temp_path[1024];
1096 int n;
1097 struct dirent *entry;
1098 DIR *tempdir;
1099
b07e6aa3
PH
1100 (void)string_format(temp_path, 1024, "%s/scan/%s", spool_directory,
1101 message_id);
54cdb463
PH
1102
1103 tempdir = opendir(CS temp_path);
1104 n = 0;
1105 do {
1106 entry = readdir(tempdir);
1107 if (entry == NULL) break;
1108 if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0) {
b07e6aa3 1109 (void)string_format(rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
54cdb463
PH
1110 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path);
1111 break;
1112 };
1113 } while (1);
1114 closedir(tempdir);
1115
1116 if (entry != NULL) {
c58b88df 1117 mbox_file = Ufopen(rfc822_file_path,"rb");
54cdb463
PH
1118 if (mbox_file == NULL) {
1119 log_write(0, LOG_PANIC,
1120 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1121 unlink(CS rfc822_file_path);
1122 goto END_MIME_ACL;
1123 };
1124 /* set RFC822 expansion variable */
1125 mime_is_rfc822 = 1;
1126 mime_part_count_buffer = mime_part_count;
1127 goto MIME_ACL_CHECK;
1128 };
1129};
1130
1131END_MIME_ACL:
1132add_acl_headers(US"MIME");
1133if (rc == DISCARD)
1134 {
1135 recipients_count = 0;
1136 *blackholed_by_ptr = US"MIME ACL";
1137 }
1138else if (rc != OK)
1139 {
1140 Uunlink(spool_name);
1141 unspool_mbox();
1142 if (smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1143 *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */
1144 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1145 message_id[0] = 0; /* Indicate no message accepted */
1146 return FALSE; /* Cause skip to end of receive function */
1147 };
1148
1149return TRUE;
1150}
1151
63955bf2 1152#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1153
1154
1155/*************************************************
059ec3d9
PH
1156* Receive message *
1157*************************************************/
1158
1159/* Receive a message on the given input, and put it into a pair of spool files.
1160Either a non-null list of recipients, or the extract flag will be true, or
1161both. The flag sender_local is true for locally generated messages. The flag
1162submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a
PH
1163suppress_local_fixups is true if an ACL has obeyed "control =
1164suppress_local_fixups". The flag smtp_input is true if the message is to be
1165handled using SMTP conventions about termination and lines starting with dots.
1166For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1167
1168If a message was successfully read, message_id[0] will be non-zero.
1169
1170The general actions of this function are:
1171
1172 . Read the headers of the message (if any) into a chain of store
1173 blocks.
1174
1175 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1176 throw it away, unless the caller is trusted, or unless
1177 active_local_sender_retain is set - which can only happen if
1178 active_local_from_check is false.
059ec3d9
PH
1179
1180 . If recipients are to be extracted from the message, build the
1181 recipients list from the headers, removing any that were on the
1182 original recipients list (unless extract_addresses_remove_arguments is
1183 false), and at the same time, remove any bcc header that may be present.
1184
1185 . Get the spool file for the data, sort out its unique name, open
1186 and lock it (but don't give it the name yet).
1187
1188 . Generate a "Message-Id" header if the message doesn't have one, for
1189 locally-originated messages.
1190
1191 . Generate a "Received" header.
1192
1193 . Ensure the recipients list is fully qualified and rewritten if necessary.
1194
1195 . If there are any rewriting rules, apply them to the sender address
1196 and also to the headers.
1197
1198 . If there is no from: header, generate one, for locally-generated messages
1199 and messages in "submission mode" only.
1200
1201 . If the sender is local, check that from: is correct, and if not, generate
1202 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1203 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1204
1205 . If there is no "date" header, generate one, for locally-originated
1206 or submission mode messages only.
1207
1208 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1209 dot_ends mode, to the data file. Leave it open, to hold the lock.
1210
1211 . Write the envelope and the headers to a new file.
1212
1213 . Set the name for the header file; close it.
1214
1215 . Set the name for the data file; close it.
1216
1217Because this function can potentially be called many times in a single
1218SMTP connection, all store should be got by store_get(), so that it will be
1219automatically retrieved after the message is accepted.
1220
1221FUDGE: It seems that sites on the net send out messages with just LF
1222terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1223we make the CRs optional in all cases.
1224
1225July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1226new regime is now in place in which bare CRs in header lines are turned into LF
1227followed by a space, so as not to terminate the header line.
1228
1229February 2004: A bare LF in a header line in a message whose first line was
1230terminated by CRLF is treated in the same way as a bare CR.
1231
1232Arguments:
1233 extract_recip TRUE if recipients are to be extracted from the message's
1234 headers
1235
1236Returns: TRUE there are more messages to be read (SMTP input)
1237 FALSE there are no more messages to be read (non-SMTP input
1238 or SMTP connection collapsed, or other failure)
1239
1240When reading a message for filter testing, the returned value indicates
1241whether the headers (which is all that is read) were terminated by '.' or
1242not. */
1243
1244BOOL
1245receive_msg(BOOL extract_recip)
1246{
1247int i, rc;
1248int msg_size = 0;
1249int process_info_len = Ustrlen(process_info);
1250int error_rc = (error_handling == ERRORS_SENDER)?
1251 errors_sender_rc : EXIT_FAILURE;
1252int header_size = 256;
1253int start, end, domain, size, sptr;
1254int id_resolution;
1255int had_zero = 0;
1256
1257register int ptr = 0;
1258
1259BOOL contains_resent_headers = FALSE;
1260BOOL extracted_ignored = FALSE;
1261BOOL first_line_ended_crlf = TRUE_UNSET;
1262BOOL smtp_yield = TRUE;
1263BOOL yield = FALSE;
1264
1265BOOL resents_exist = FALSE;
1266uschar *resent_prefix = US"";
1267uschar *blackholed_by = NULL;
04f7d5b9 1268uschar *blackhole_log_msg = US"";
059ec3d9
PH
1269
1270flock_t lock_data;
1271error_block *bad_addresses = NULL;
1272
1273uschar *frozen_by = NULL;
1274uschar *queued_by = NULL;
1275
1276uschar *errmsg, *s;
1277struct stat statbuf;
1278
1279/* Final message to give to SMTP caller */
1280
1281uschar *smtp_reply = NULL;
1282
1283/* Working header pointers */
1284
1285header_line *h, *next;
1286
2cbb4081 1287/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1288
1289BOOL date_header_exists = FALSE;
1290
1291/* Pointers to receive the addresses of headers whose contents we need. */
1292
1293header_line *from_header = NULL;
1294header_line *subject_header = NULL;
1295header_line *msgid_header = NULL;
1296header_line *received_header;
1297
1298/* Variables for use when building the Received: header. */
1299
1300uschar *received;
1301uschar *timestamp;
1302int tslen;
1303
1304/* Release any open files that might have been cached while preparing to
1305accept the message - e.g. by verifying addresses - because reading a message
1306might take a fair bit of real time. */
1307
1308search_tidyup();
1309
1310/* Initialize the chain of headers by setting up a place-holder for Received:
1311header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1312pointing to the end of the chain to make adding headers simple. */
1313
1314received_header = header_list = header_last = store_get(sizeof(header_line));
1315header_list->next = NULL;
1316header_list->type = htype_old;
1317header_list->text = NULL;
1318header_list->slen = 0;
1319
1320/* Control block for the next header to be read. */
1321
1322next = store_get(sizeof(header_line));
1323next->text = store_get(header_size);
1324
1325/* Initialize message id to be null (indicating no message read), and the
1326header names list to be the normal list. Indicate there is no data file open
1327yet, initialize the size and warning count, and deal with no size limit. */
1328
1329message_id[0] = 0;
1330data_file = NULL;
1331data_fd = -1;
1332spool_name[0] = 0;
1333message_size = 0;
1334warning_count = 0;
1335received_count = 1; /* For the one we will add */
1336
1337if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1338
2e0c1448 1339/* While reading the message, the following counts are computed. */
059ec3d9 1340
2e0c1448 1341message_linecount = body_linecount = body_zerocount = 0;
059ec3d9 1342
fb2274d4
TK
1343#ifdef EXPERIMENTAL_DOMAINKEYS
1344/* Call into DK to set up the context. Check if DK is to be run are carried out
1345 inside dk_exim_verify_init(). */
1346dk_exim_verify_init();
1347#endif
1348
059ec3d9
PH
1349/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1350ids, and fractions of a second are required. See the comments that precede the
1351message id creation below. */
1352
1353(void)gettimeofday(&message_id_tv, NULL);
1354
1355/* For other uses of the received time we can operate with granularity of one
1356second, and for that we use the global variable received_time. This is for
1357things like ultimate message timeouts. */
1358
1359received_time = message_id_tv.tv_sec;
1360
1361/* If SMTP input, set the special handler for timeouts. The alarm() calls
1362happen in the smtp_getc() function when it refills its buffer. */
1363
1364if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1365
1366/* If not SMTP input, timeout happens only if configured, and we just set a
1367single timeout for the whole message. */
1368
1369else if (receive_timeout > 0)
1370 {
1371 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1372 alarm(receive_timeout);
1373 }
1374
1375/* SIGTERM and SIGINT are caught always. */
1376
1377signal(SIGTERM, data_sigterm_sigint_handler);
1378signal(SIGINT, data_sigterm_sigint_handler);
1379
1380/* Header lines in messages are not supposed to be very long, though when
1381unfolded, to: and cc: headers can take up a lot of store. We must also cope
1382with the possibility of junk being thrown at us. Start by getting 256 bytes for
1383storing the header, and extend this as necessary using string_cat().
1384
1385To cope with total lunacies, impose an upper limit on the length of the header
1386section of the message, as otherwise the store will fill up. We must also cope
1387with the possibility of binary zeros in the data. Hence we cannot use fgets().
1388Folded header lines are joined into one string, leaving the '\n' characters
1389inside them, so that writing them out reproduces the input.
1390
1391Loop for each character of each header; the next structure for chaining the
1392header is set up already, with ptr the offset of the next character in
1393next->text. */
1394
1395for (;;)
1396 {
fb2274d4 1397 int ch = (RECEIVE_GETC)();
059ec3d9
PH
1398
1399 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1400 SMTP must have a correct "." terminator. */
1401
1402 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1403 {
1404 smtp_reply = handle_lost_connection(US" (header)");
1405 smtp_yield = FALSE;
1406 goto TIDYUP; /* Skip to end of function */
1407 }
1408
1409 /* See if we are at the current header's size limit - there must be at least
1410 four bytes left. This allows for the new character plus a zero, plus two for
1411 extra insertions when we are playing games with dots and carriage returns. If
1412 we are at the limit, extend the text buffer. This could have been done
1413 automatically using string_cat() but because this is a tightish loop storing
1414 only one character at a time, we choose to do it inline. Normally
1415 store_extend() will be able to extend the block; only at the end of a big
1416 store block will a copy be needed. To handle the case of very long headers
1417 (and sometimes lunatic messages can have ones that are 100s of K long) we
1418 call store_release() for strings that have been copied - if the string is at
1419 the start of a block (and therefore the only thing in it, because we aren't
1420 doing any other gets), the block gets freed. We can only do this because we
1421 know there are no other calls to store_get() going on. */
1422
1423 if (ptr >= header_size - 4)
1424 {
1425 int oldsize = header_size;
1426 /* header_size += 256; */
1427 header_size *= 2;
1428 if (!store_extend(next->text, oldsize, header_size))
1429 {
1430 uschar *newtext = store_get(header_size);
1431 memcpy(newtext, next->text, ptr);
1432 store_release(next->text);
1433 next->text = newtext;
1434 }
1435 }
1436
1437 /* Cope with receiving a binary zero. There is dispute about whether
1438 these should be allowed in RFC 822 messages. The middle view is that they
1439 should not be allowed in headers, at least. Exim takes this attitude at
1440 the moment. We can't just stomp on them here, because we don't know that
1441 this line is a header yet. Set a flag to cause scanning later. */
1442
1443 if (ch == 0) had_zero++;
1444
1445 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1446 those from data files use just LF. Treat LF in local SMTP input as a
1447 terminator too. Treat EOF as a line terminator always. */
1448
1449 if (ch == EOF) goto EOL;
1450
1451 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1452 other MTAs accept this. We are therefore forced into this "liberalisation"
1453 too, so we accept LF as a line terminator whatever the source of the message.
1454 However, if the first line of the message ended with a CRLF, we treat a bare
1455 LF specially by inserting a white space after it to ensure that the header
1456 line is not terminated. */
1457
1458 if (ch == '\n')
1459 {
1460 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
fb2274d4 1461 else if (first_line_ended_crlf) RECEIVE_UNGETC(' ');
059ec3d9
PH
1462 goto EOL;
1463 }
1464
1465 /* This is not the end of the line. If this is SMTP input and this is
1466 the first character in the line and it is a "." character, ignore it.
1467 This implements the dot-doubling rule, though header lines starting with
1468 dots aren't exactly common. They are legal in RFC 822, though. If the
1469 following is CRLF or LF, this is the line that that terminates the
1470 entire message. We set message_ended to indicate this has happened (to
1471 prevent further reading), and break out of the loop, having freed the
1472 empty header, and set next = NULL to indicate no data line. */
1473
1474 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1475 {
fb2274d4 1476 ch = (RECEIVE_GETC)();
059ec3d9
PH
1477 if (ch == '\r')
1478 {
fb2274d4 1479 ch = (RECEIVE_GETC)();
059ec3d9
PH
1480 if (ch != '\n')
1481 {
fb2274d4 1482 RECEIVE_UNGETC(ch);
059ec3d9
PH
1483 ch = '\r'; /* Revert to CR */
1484 }
1485 }
1486 if (ch == '\n')
1487 {
1488 message_ended = END_DOT;
1489 store_reset(next);
1490 next = NULL;
1491 break; /* End character-reading loop */
1492 }
1493
1494 /* For non-SMTP input, the dot at the start of the line was really a data
1495 character. What is now in ch is the following character. We guaranteed
1496 enough space for this above. */
1497
1498 if (!smtp_input)
1499 {
1500 next->text[ptr++] = '.';
1501 message_size++;
1502 }
1503 }
1504
1505 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1506 remember this case if this is the first line ending. */
1507
1508 if (ch == '\r')
1509 {
fb2274d4 1510 ch = (RECEIVE_GETC)();
059ec3d9
PH
1511 if (ch == '\n')
1512 {
1513 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1514 goto EOL;
1515 }
1516
1517 /* Otherwise, put back the character after CR, and turn the bare CR
1518 into LF SP. */
1519
fb2274d4 1520 ch = (RECEIVE_UNGETC)(ch);
059ec3d9
PH
1521 next->text[ptr++] = '\n';
1522 message_size++;
1523 ch = ' ';
1524 }
1525
1526 /* We have a data character for the header line. */
1527
1528 next->text[ptr++] = ch; /* Add to buffer */
1529 message_size++; /* Total message size so far */
1530
1531 /* Handle failure due to a humungously long header section. The >= allows
1532 for the terminating \n. Add what we have so far onto the headers list so
1533 that it gets reflected in any error message, and back up the just-read
1534 character. */
1535
1536 if (message_size >= header_maxsize)
1537 {
1538 next->text[ptr] = 0;
1539 next->slen = ptr;
1540 next->type = htype_other;
1541 next->next = NULL;
1542 header_last->next = next;
1543 header_last = next;
1544
1545 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1546 "%s (more than %d characters): message abandoned",
1547 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1548
1549 if (smtp_input)
1550 {
1551 smtp_reply = US"552 Message header is ridiculously long";
1552 receive_swallow_smtp();
1553 goto TIDYUP; /* Skip to end of function */
1554 }
1555
1556 else
1557 {
1558 give_local_error(ERRMESS_VLONGHEADER,
1559 string_sprintf("message header longer than %d characters received: "
1560 "message not accepted", header_maxsize), US"", error_rc, stdin,
1561 header_list->next);
1562 /* Does not return */
1563 }
1564 }
1565
1566 continue; /* With next input character */
1567
1568 /* End of header line reached */
1569
1570 EOL:
2e0c1448
PH
1571
1572 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1573
1574 receive_linecount++;
1575 message_linecount++;
059ec3d9
PH
1576
1577 /* Now put in the terminating newline. There is always space for
1578 at least two more characters. */
1579
1580 next->text[ptr++] = '\n';
1581 message_size++;
1582
1583 /* A blank line signals the end of the headers; release the unwanted
1584 space and set next to NULL to indicate this. */
1585
1586 if (ptr == 1)
1587 {
1588 store_reset(next);
1589 next = NULL;
1590 break;
1591 }
1592
1593 /* There is data in the line; see if the next input character is a
1594 whitespace character. If it is, we have a continuation of this header line.
1595 There is always space for at least one character at this point. */
1596
1597 if (ch != EOF)
1598 {
fb2274d4 1599 int nextch = (RECEIVE_GETC)();
059ec3d9
PH
1600 if (nextch == ' ' || nextch == '\t')
1601 {
1602 next->text[ptr++] = nextch;
1603 message_size++;
1604 continue; /* Iterate the loop */
1605 }
fb2274d4 1606 else if (nextch != EOF) (RECEIVE_UNGETC)(nextch); /* For next time */
059ec3d9
PH
1607 else ch = EOF; /* Cause main loop to exit at end */
1608 }
1609
1610 /* We have got to the real line end. Terminate the string and release store
1611 beyond it. If it turns out to be a real header, internal binary zeros will
1612 be squashed later. */
1613
1614 next->text[ptr] = 0;
1615 next->slen = ptr;
1616 store_reset(next->text + ptr + 1);
1617
1618 /* Check the running total size against the overall message size limit. We
1619 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1620 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1621 headers - the code to read the body will then also hit the buffer. */
1622
1623 if (message_size > thismessage_size_limit) break;
1624
1625 /* A line that is not syntactically correct for a header also marks
1626 the end of the headers. In this case, we leave next containing the
1627 first data line. This might actually be several lines because of the
1628 continuation logic applied above, but that doesn't matter.
1629
1630 It turns out that smail, and presumably sendmail, accept leading lines
1631 of the form
1632
1633 From ph10 Fri Jan 5 12:35 GMT 1996
1634
1635 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1636 find any documentation of this, but for compatibility it had better be
1637 accepted. Exim restricts it to the case of non-smtp messages, and
1638 treats it as an alternative to the -f command line option. Thus it is
1639 ignored except for trusted users or filter testing. Otherwise it is taken
1640 as the sender address, unless -f was used (sendmail compatibility).
1641
1642 It further turns out that some UUCPs generate the From_line in a different
1643 format, e.g.
1644
1645 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1646
1647 The regex for matching these things is now capable of recognizing both
1648 formats (including 2- and 4-digit years in the latter). In fact, the regex
1649 is now configurable, as is the expansion string to fish out the sender.
1650
1651 Even further on it has been discovered that some broken clients send
1652 these lines in SMTP messages. There is now an option to ignore them from
1653 specified hosts or networks. Sigh. */
1654
1655 if (header_last == header_list &&
1656 (!smtp_input
1657 ||
1658 (sender_host_address != NULL &&
1659 verify_check_host(&ignore_fromline_hosts) == OK)
1660 ||
1661 (sender_host_address == NULL && ignore_fromline_local)
1662 ) &&
1663 regex_match_and_setup(regex_From, next->text, 0, -1))
1664 {
1665 if (!sender_address_forced)
1666 {
1667 uschar *uucp_sender = expand_string(uucp_from_sender);
1668 if (uucp_sender == NULL)
1669 {
1670 log_write(0, LOG_MAIN|LOG_PANIC,
1671 "expansion of \"%s\" failed after matching "
1672 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1673 }
1674 else
1675 {
1676 int start, end, domain;
1677 uschar *errmess;
1678 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1679 &start, &end, &domain, TRUE);
1680 if (newsender != NULL)
1681 {
1682 if (domain == 0 && newsender[0] != 0)
1683 newsender = rewrite_address_qualify(newsender, FALSE);
1684
f05da2e8 1685 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1686 {
1687 sender_address = newsender;
1688
f05da2e8 1689 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1690 {
1691 authenticated_sender = NULL;
1692 originator_name = US"";
1693 sender_local = FALSE;
1694 }
1695
f05da2e8 1696 if (filter_test != FTEST_NONE)
059ec3d9
PH
1697 printf("Sender taken from \"From \" line\n");
1698 }
1699 }
1700 }
1701 }
1702 }
1703
1704 /* Not a leading "From " line. Check to see if it is a valid header line.
1705 Header names may contain any non-control characters except space and colon,
1706 amazingly. */
1707
1708 else
1709 {
1710 uschar *p = next->text;
1711
1712 /* If not a valid header line, break from the header reading loop, leaving
1713 next != NULL, indicating that it holds the first line of the body. */
1714
1715 if (isspace(*p)) break;
1716 while (mac_isgraph(*p) && *p != ':') p++;
1717 while (isspace(*p)) p++;
1718 if (*p != ':')
1719 {
1720 body_zerocount = had_zero;
1721 break;
1722 }
1723
1724 /* We have a valid header line. If there were any binary zeroes in
1725 the line, stomp on them here. */
1726
1727 if (had_zero > 0)
1728 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
1729
1730 /* It is perfectly legal to have an empty continuation line
1731 at the end of a header, but it is confusing to humans
1732 looking at such messages, since it looks like a blank line.
1733 Reduce confusion by removing redundant white space at the
1734 end. We know that there is at least one printing character
1735 (the ':' tested for above) so there is no danger of running
1736 off the end. */
1737
1738 p = next->text + ptr - 2;
1739 for (;;)
1740 {
1741 while (*p == ' ' || *p == '\t') p--;
1742 if (*p != '\n') break;
1743 ptr = (p--) - next->text + 1;
1744 message_size -= next->slen - ptr;
1745 next->text[ptr] = 0;
1746 next->slen = ptr;
1747 }
1748
1749 /* Add the header to the chain */
1750
1751 next->type = htype_other;
1752 next->next = NULL;
1753 header_last->next = next;
1754 header_last = next;
1755
1756 /* Check the limit for individual line lengths. This comes after adding to
1757 the chain so that the failing line is reflected if a bounce is generated
1758 (for a local message). */
1759
1760 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
1761 {
1762 log_write(0, LOG_MAIN, "overlong message header line received from "
1763 "%s (more than %d characters): message abandoned",
1764 sender_host_unknown? sender_ident : sender_fullhost,
1765 header_line_maxsize);
1766
1767 if (smtp_input)
1768 {
1769 smtp_reply = US"552 A message header line is too long";
1770 receive_swallow_smtp();
1771 goto TIDYUP; /* Skip to end of function */
1772 }
1773
1774 else
1775 {
1776 give_local_error(ERRMESS_VLONGHDRLINE,
1777 string_sprintf("message header line longer than %d characters "
1778 "received: message not accepted", header_line_maxsize), US"",
1779 error_rc, stdin, header_list->next);
1780 /* Does not return */
1781 }
1782 }
1783
1784 /* Note if any resent- fields exist. */
1785
1786 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
1787 {
1788 resents_exist = TRUE;
1789 resent_prefix = US"Resent-";
1790 }
1791 }
1792
1793 /* The line has been handled. If we have hit EOF, break out of the loop,
1794 indicating no pending data line. */
1795
1796 if (ch == EOF) { next = NULL; break; }
1797
1798 /* Set up for the next header */
1799
1800 header_size = 256;
1801 next = store_get(sizeof(header_line));
1802 next->text = store_get(header_size);
1803 ptr = 0;
1804 had_zero = 0;
1805 } /* Continue, starting to read the next header */
1806
1807/* At this point, we have read all the headers into a data structure in main
1808store. The first header is still the dummy placeholder for the Received: header
1809we are going to generate a bit later on. If next != NULL, it contains the first
1810data line - which terminated the headers before reaching a blank line (not the
1811normal case). */
1812
1813DEBUG(D_receive)
1814 {
1815 debug_printf(">>Headers received:\n");
1816 for (h = header_list->next; h != NULL; h = h->next)
1817 debug_printf("%s", h->text);
1818 debug_printf("\n");
1819 }
1820
1821/* End of file on any SMTP connection is an error. If an incoming SMTP call
1822is dropped immediately after valid headers, the next thing we will see is EOF.
1823We must test for this specially, as further down the reading of the data is
1824skipped if already at EOF. */
1825
1826if (smtp_input && (receive_feof)())
1827 {
1828 smtp_reply = handle_lost_connection(US" (after header)");
1829 smtp_yield = FALSE;
1830 goto TIDYUP; /* Skip to end of function */
1831 }
1832
1833/* If this is a filter test run and no headers were read, output a warning
1834in case there is a mistake in the test message. */
1835
f05da2e8 1836if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
1837 printf("Warning: no message headers read\n");
1838
1839
1840/* Scan the headers to identify them. Some are merely marked for later
1841processing; some are dealt with here. */
1842
1843for (h = header_list->next; h != NULL; h = h->next)
1844 {
1845 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
1846 if (is_resent) contains_resent_headers = TRUE;
1847
1848 switch (header_checkname(h, is_resent))
1849 {
059ec3d9 1850 case htype_bcc:
2cbb4081 1851 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
1852 break;
1853
059ec3d9 1854 case htype_cc:
2cbb4081 1855 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
1856 break;
1857
1858 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
1859
1860 case htype_date:
1861 date_header_exists = !resents_exist || is_resent;
1862 break;
1863
1864 /* Same comments as about Return-Path: below. */
1865
1866 case htype_delivery_date:
1867 if (delivery_date_remove) h->type = htype_old;
1868 break;
1869
1870 /* Same comments as about Return-Path: below. */
1871
1872 case htype_envelope_to:
1873 if (envelope_to_remove) h->type = htype_old;
1874 break;
1875
1876 /* Mark all "From:" headers so they get rewritten. Save the one that is to
1877 be used for Sender: checking. For Sendmail compatibility, if the "From:"
1878 header consists of just the login id of the user who called Exim, rewrite
1879 it with the gecos field first. Apply this rule to Resent-From: if there
1880 are resent- fields. */
1881
1882 case htype_from:
1883 h->type = htype_from;
1884 if (!resents_exist || is_resent)
1885 {
1886 from_header = h;
1887 if (!smtp_input)
1888 {
1889 uschar *s = Ustrchr(h->text, ':') + 1;
1890 while (isspace(*s)) s++;
1891 if (strncmpic(s, originator_login, h->slen - (s - h->text) - 1) == 0)
1892 {
1893 uschar *name = is_resent? US"Resent-From" : US"From";
1894 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
1895 originator_login, qualify_domain_sender);
1896 from_header = header_last;
1897 h->type = htype_old;
1898 DEBUG(D_receive|D_rewrite)
1899 debug_printf("rewrote \"%s:\" header using gecos\n", name);
1900 }
1901 }
1902 }
1903 break;
1904
1905 /* Identify the Message-id: header for generating "in-reply-to" in the
1906 autoreply transport. For incoming logging, save any resent- value. In both
1907 cases, take just the first of any multiples. */
1908
1909 case htype_id:
1910 if (msgid_header == NULL && (!resents_exist || is_resent))
1911 {
1912 msgid_header = h;
1913 h->type = htype_id;
1914 }
1915 break;
1916
1917 /* Flag all Received: headers */
1918
1919 case htype_received:
1920 h->type = htype_received;
1921 received_count++;
1922 break;
1923
1924 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
1925
1926 case htype_reply_to:
1927 h->type = htype_reply_to;
1928 break;
1929
1930 /* The Return-path: header is supposed to be added to messages when
1931 they leave the SMTP system. We shouldn't receive messages that already
1932 contain Return-path. However, since Exim generates Return-path: on
1933 local delivery, resent messages may well contain it. We therefore
1934 provide an option (which defaults on) to remove any Return-path: headers
1935 on input. Removal actually means flagging as "old", which prevents the
1936 header being transmitted with the message. */
1937
1938 case htype_return_path:
1939 if (return_path_remove) h->type = htype_old;
1940
1941 /* If we are testing a mail filter file, use the value of the
1942 Return-Path: header to set up the return_path variable, which is not
1943 otherwise set. However, remove any <> that surround the address
1944 because the variable doesn't have these. */
1945
f05da2e8 1946 if (filter_test != FTEST_NONE)
059ec3d9
PH
1947 {
1948 uschar *start = h->text + 12;
1949 uschar *end = start + Ustrlen(start);
1950 while (isspace(*start)) start++;
1951 while (end > start && isspace(end[-1])) end--;
1952 if (*start == '<' && end[-1] == '>')
1953 {
1954 start++;
1955 end--;
1956 }
1957 return_path = string_copyn(start, end - start);
1958 printf("Return-path taken from \"Return-path:\" header line\n");
1959 }
1960 break;
1961
1962 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
1963 and from an untrusted caller and suppress_local_fixups is not set, or if we
1964 are in submission mode for a remote message, mark it "old" so that it will
1965 not be transmitted with the message, unless active_local_sender_retain is
1966 set. (This can only be true if active_local_from_check is false.) If there
1967 are any resent- headers in the message, apply this rule to Resent-Sender:
1968 instead of Sender:. Messages with multiple resent- header sets cannot be
1969 tidily handled. (For this reason, at least one MUA - Pine - turns old
1970 resent- headers into X-resent- headers when resending, leaving just one
1971 set.) */
059ec3d9
PH
1972
1973 case htype_sender:
69358f02 1974 h->type = ((!active_local_sender_retain &&
8800895a
PH
1975 (
1976 (sender_local && !trusted_caller && !suppress_local_fixups)
1977 || submission_mode
1978 )
059ec3d9
PH
1979 ) &&
1980 (!resents_exist||is_resent))?
1981 htype_old : htype_sender;
1982 break;
1983
1984 /* Remember the Subject: header for logging. There is no Resent-Subject */
1985
1986 case htype_subject:
1987 subject_header = h;
1988 break;
1989
1990 /* "To:" gets flagged, and the existence of a recipient header is noted,
1991 whether it's resent- or not. */
1992
1993 case htype_to:
1994 h->type = htype_to;
1995 /****
1996 to_or_cc_header_exists = TRUE;
1997 ****/
1998 break;
1999 }
2000 }
2001
2002/* Extract recipients from the headers if that is required (the -t option).
2003Note that this is documented as being done *before* any address rewriting takes
2004place. There are two possibilities:
2005
2006(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2007recipients already listed are to be REMOVED from the message. Smail 3 works
2008like this. We need to build a non-recipients tree for that list, because in
2009subsequent processing this data is held in a tree and that's what the
2010spool_write_header() function expects. Make sure that non-recipient addresses
2011are fully qualified and rewritten if necessary.
2012
2013(2) According to other sendmail documentation, -t ADDS extracted recipients to
2014those in the command line arguments (and it is rumoured some other MTAs do
2015this). Therefore, there is an option to make Exim behave this way.
2016
2017*** Notes on "Resent-" header lines ***
2018
2019The presence of resent-headers in the message makes -t horribly ambiguous.
2020Experiments with sendmail showed that it uses recipients for all resent-
2021headers, totally ignoring the concept of "sets of resent- headers" as described
2022in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2023with all the addresses in one instance of each header.
2024
2025This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2026error for -t if there were resent- headers in the message. However, after a
2027discussion on the mailing list, I've learned that there are MUAs that use
2028resent- headers with -t, and also that the stuff about sets of resent- headers
2029and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2030message with -t and resent- header lines makes sure that only *its* resent-
2031headers are present; previous ones are often renamed as X-resent- for example.
2032
2033Consequently, Exim has been changed so that, if any resent- header lines are
2034present, the recipients are taken from all of the appropriate resent- lines,
2035and not from the ordinary To:, Cc:, etc. */
2036
2037if (extract_recip)
2038 {
2039 int rcount = 0;
2040 error_block **bnext = &bad_addresses;
2041
2042 if (extract_addresses_remove_arguments)
2043 {
2044 while (recipients_count-- > 0)
2045 {
2046 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2047 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2048 tree_add_nonrecipient(s);
2049 }
2050 recipients_list = NULL;
2051 recipients_count = recipients_list_max = 0;
2052 }
2053
2054 parse_allow_group = TRUE; /* Allow address group syntax */
2055
2056 /* Now scan the headers */
2057
2058 for (h = header_list->next; h != NULL; h = h->next)
2059 {
2060 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2061 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2062 {
2063 uschar *s = Ustrchr(h->text, ':') + 1;
2064 while (isspace(*s)) s++;
2065
2066 while (*s != 0)
2067 {
2068 uschar *ss = parse_find_address_end(s, FALSE);
2069 uschar *recipient, *errmess, *p, *pp;
2070 int start, end, domain;
2071
2072 /* Check on maximum */
2073
2074 if (recipients_max > 0 && ++rcount > recipients_max)
2075 {
2076 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2077 US"message rejected: ", error_rc, stdin, NULL);
2078 /* Does not return */
2079 }
2080
2081 /* Make a copy of the address, and remove any internal newlines. These
2082 may be present as a result of continuations of the header line. The
2083 white space that follows the newline must not be removed - it is part
2084 of the header. */
2085
2086 pp = recipient = store_get(ss - s + 1);
2087 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2088 *pp = 0;
2089 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2090 &domain, FALSE);
2091
2092 /* Keep a list of all the bad addresses so we can send a single
2093 error message at the end. However, an empty address is not an error;
2094 just ignore it. This can come from an empty group list like
2095
2096 To: Recipients of list:;
2097
2098 If there are no recipients at all, an error will occur later. */
2099
2100 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2101 {
2102 int len = Ustrlen(s);
2103 error_block *b = store_get(sizeof(error_block));
2104 while (len > 0 && isspace(s[len-1])) len--;
2105 b->next = NULL;
2106 b->text1 = string_printing(string_copyn(s, len));
2107 b->text2 = errmess;
2108 *bnext = b;
2109 bnext = &(b->next);
2110 }
2111
2112 /* If the recipient is already in the nonrecipients tree, it must
2113 have appeared on the command line with the option extract_addresses_
2114 remove_arguments set. Do not add it to the recipients, and keep a note
2115 that this has happened, in order to give a better error if there are
2116 no recipients left. */
2117
2118 else if (recipient != NULL)
2119 {
2120 if (tree_search(tree_nonrecipients, recipient) == NULL)
2121 receive_add_recipient(recipient, -1);
2122 else
2123 extracted_ignored = TRUE;
2124 }
2125
2126 /* Move on past this address */
2127
2128 s = ss + (*ss? 1:0);
2129 while (isspace(*s)) s++;
2130 }
2131
2132 /* If this was the bcc: header, mark it "old", which means it
2133 will be kept on the spool, but not transmitted as part of the
2134 message. */
2135
2cbb4081 2136 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2137 } /* For appropriate header line */
2138 } /* For each header line */
2139
2140 parse_allow_group = FALSE; /* Reset group syntax flags */
2141 parse_found_group = FALSE;
2142 }
2143
2144/* Now build the unique message id. This has changed several times over the
2145lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2146Retaining all the history in the comment has become too unwieldy - read
2147previous release sources if you want it.
2148
2149The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2150The first part is the current time, in seconds. The second part is the current
2151pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2152can hold a number in the range 0-3843. It used to be a computed sequence
2153number, but is now the fractional component of the current time in units of
21541/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2155received, Exim ensures that the timer has ticked at the appropriate level
2156before proceeding, to avoid duplication if the pid happened to be re-used
2157within the same time period. It seems likely that most messages will take at
2158least half a millisecond to be received, so no delay will normally be
2159necessary. At least for some time...
2160
2161There is a modification when localhost_number is set. Formerly this was allowed
2162to be as large as 255. Now it is restricted to the range 0-16, and the final
2163component of the message id becomes (localhost_number * 200) + fractional time
2164in units of 1/200 of a second (i.e. a value in the range 0-3399).
2165
2166Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2167Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2168still allows the tttttt field to hold a large enough number to last for some
2169more decades, and the final two-digit field can hold numbers up to 1295, which
2170is enough for milliseconds (instead of 1/2000 of a second).
2171
2172However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2173pid, so it is probably safe because pids have to be positive. The
2174localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2175final field becomes (localhost_number * 100) + fractional time in centiseconds.
2176
2177Note that string_base62() returns its data in a static storage block, so it
2178must be copied before calling string_base62() again. It always returns exactly
21796 characters.
2180
2181There doesn't seem to be anything in the RFC which requires a message id to
2182start with a letter, but Smail was changed to ensure this. The external form of
2183the message id (as supplied by string expansion) therefore starts with an
2184additional leading 'E'. The spool file names do not include this leading
2185letter and it is not used internally.
2186
2187NOTE: If ever the format of message ids is changed, the regular expression for
2188checking that a string is in this format must be updated in a corresponding
2189way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2190must also be changed to reflect the correct string length. Then, of course,
2191other programs that rely on the message id format will need updating too. */
2192
2193Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2194message_id[6] = '-';
2195Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2196
2197/* Deal with the case where the host number is set. The value of the number was
2198checked when it was read, to ensure it isn't too big. The timing granularity is
2199left in id_resolution so that an appropriate wait can be done after receiving
2200the message, if necessary (we hope it won't be). */
2201
2202if (host_number_string != NULL)
2203 {
2204 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2205 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2206 string_base62((long int)(
2207 host_number * (1000000/id_resolution) +
2208 message_id_tv.tv_usec/id_resolution)) + 4);
2209 }
2210
2211/* Host number not set: final field is just the fractional time at an
2212appropriate resolution. */
2213
2214else
2215 {
2216 id_resolution = (BASE_62 == 62)? 500 : 1000;
2217 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2218 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2219 }
2220
2221/* Add the current message id onto the current process info string if
2222it will fit. */
2223
2224(void)string_format(process_info + process_info_len,
2225 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2226
2227/* If we are using multiple input directories, set up the one for this message
2228to be the least significant base-62 digit of the time of arrival. Otherwise
2229ensure that it is an empty string. */
2230
2231message_subdir[0] = split_spool_directory? message_id[5] : 0;
2232
2233/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2234one, but only for local (without suppress_local_fixups) or submission mode
2235messages. This can be user-configured if required, but we had better flatten
2236any illegal characters therein. */
059ec3d9 2237
8800895a
PH
2238if (msgid_header == NULL &&
2239 ((sender_host_address == NULL && !suppress_local_fixups)
2240 || submission_mode))
059ec3d9
PH
2241 {
2242 uschar *p;
2243 uschar *id_text = US"";
2244 uschar *id_domain = primary_hostname;
2245
2246 /* Permit only letters, digits, dots, and hyphens in the domain */
2247
2248 if (message_id_domain != NULL)
2249 {
2250 uschar *new_id_domain = expand_string(message_id_domain);
2251 if (new_id_domain == NULL)
2252 {
2253 if (!expand_string_forcedfail)
2254 log_write(0, LOG_MAIN|LOG_PANIC,
2255 "expansion of \"%s\" (message_id_header_domain) "
2256 "failed: %s", message_id_domain, expand_string_message);
2257 }
2258 else if (*new_id_domain != 0)
2259 {
2260 id_domain = new_id_domain;
2261 for (p = id_domain; *p != 0; p++)
2262 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2263 }
2264 }
2265
2266 /* Permit all characters except controls and RFC 2822 specials in the
2267 additional text part. */
2268
2269 if (message_id_text != NULL)
2270 {
2271 uschar *new_id_text = expand_string(message_id_text);
2272 if (new_id_text == NULL)
2273 {
2274 if (!expand_string_forcedfail)
2275 log_write(0, LOG_MAIN|LOG_PANIC,
2276 "expansion of \"%s\" (message_id_header_text) "
2277 "failed: %s", message_id_text, expand_string_message);
2278 }
2279 else if (*new_id_text != 0)
2280 {
2281 id_text = new_id_text;
2282 for (p = id_text; *p != 0; p++)
2283 if (mac_iscntrl_or_special(*p)) *p = '-';
2284 }
2285 }
2286
2287 /* Add the header line */
2288
2289 header_add(htype_id, "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix,
2290 message_id_external, (*id_text == 0)? "" : ".", id_text, id_domain);
2291 }
2292
2293/* If we are to log recipients, keep a copy of the raw ones before any possible
2294rewriting. Must copy the count, because later ACLs and the local_scan()
2295function may mess with the real recipients. */
2296
2297if ((log_extra_selector & LX_received_recipients) != 0)
2298 {
2299 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2300 for (i = 0; i < recipients_count; i++)
2301 raw_recipients[i] = string_copy(recipients_list[i].address);
2302 raw_recipients_count = recipients_count;
2303 }
2304
2305/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2306recipients will get here only if the conditions were right (allow_unqualified_
2307recipient is TRUE). */
2308
2309for (i = 0; i < recipients_count; i++)
2310 recipients_list[i].address =
2311 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2312 global_rewrite_rules, rewrite_existflags);
2313
8800895a
PH
2314/* If there is no From: header, generate one for local (without
2315suppress_local_fixups) or submission_mode messages. If there is no sender
2316address, but the sender is local or this is a local delivery error, use the
2317originator login. This shouldn't happen for genuine bounces, but might happen
2318for autoreplies. The addition of From: must be done *before* checking for the
2319possible addition of a Sender: header, because untrusted_set_sender allows an
2320untrusted user to set anything in the envelope (which might then get info
2321From:) but we still want to ensure a valid Sender: if it is required. */
2322
2323if (from_header == NULL &&
2324 ((sender_host_address == NULL && !suppress_local_fixups)
2325 || submission_mode))
059ec3d9 2326 {
2fe1a124
PH
2327 uschar *oname = US"";
2328
2329 /* Use the originator_name if this is a locally submitted message and the
2330 caller is not trusted. For trusted callers, use it only if -F was used to
2331 force its value or if we have a non-SMTP message for which -f was not used
2332 to set the sender. */
2333
2334 if (sender_host_address == NULL)
2335 {
2336 if (!trusted_caller || sender_name_forced ||
2337 (!smtp_input && !sender_address_forced))
2338 oname = originator_name;
2339 }
2340
2341 /* For non-locally submitted messages, the only time we use the originator
2342 name is when it was forced by the /name= option on control=submission. */
2343
2344 else
2345 {
2346 if (submission_name != NULL) oname = submission_name;
2347 }
2348
059ec3d9
PH
2349 /* Envelope sender is empty */
2350
2351 if (sender_address[0] == 0)
2352 {
87ba3f5f
PH
2353 uschar *fromstart, *fromend;
2354
2355 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2356 oname, (oname[0] == 0)? "" : " <");
2357 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2358
059ec3d9
PH
2359 if (sender_local || local_error_message)
2360 {
87ba3f5f
PH
2361 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2362 local_part_quote(originator_login), qualify_domain_sender,
2363 fromend);
059ec3d9
PH
2364 }
2365 else if (submission_mode && authenticated_id != NULL)
2366 {
2367 if (submission_domain == NULL)
2368 {
87ba3f5f
PH
2369 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2370 local_part_quote(authenticated_id), qualify_domain_sender,
2371 fromend);
059ec3d9
PH
2372 }
2373 else if (submission_domain[0] == 0) /* empty => whole address set */
2374 {
87ba3f5f
PH
2375 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2376 fromend);
059ec3d9
PH
2377 }
2378 else
2379 {
87ba3f5f
PH
2380 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2381 local_part_quote(authenticated_id), submission_domain,
2382 fromend);
059ec3d9
PH
2383 }
2384 from_header = header_last; /* To get it checked for Sender: */
2385 }
2386 }
2387
2388 /* There is a non-null envelope sender. Build the header using the original
2389 sender address, before any rewriting that might have been done while
2390 verifying it. */
2391
2392 else
2393 {
87ba3f5f 2394 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2395 oname,
2396 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2397 (sender_address_unrewritten == NULL)?
2398 sender_address : sender_address_unrewritten,
2fe1a124 2399 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2400
2401 from_header = header_last; /* To get it checked for Sender: */
2402 }
2403 }
2404
2405
8800895a
PH
2406/* If the sender is local (without suppress_local_fixups), or if we are in
2407submission mode and there is an authenticated_id, check that an existing From:
2408is correct, and if not, generate a Sender: header, unless disabled. Any
2409previously-existing Sender: header was removed above. Note that sender_local,
2410as well as being TRUE if the caller of exim is not trusted, is also true if a
2411trusted caller did not supply a -f argument for non-smtp input. To allow
2412trusted callers to forge From: without supplying -f, we have to test explicitly
2413here. If the From: header contains more than one address, then the call to
2414parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2415
2416if (from_header != NULL &&
69358f02 2417 (active_local_from_check &&
8800895a 2418 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2419 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2420 ))
2421 {
2422 BOOL make_sender = TRUE;
2423 int start, end, domain;
2424 uschar *errmess;
2425 uschar *from_address =
2426 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2427 &start, &end, &domain, FALSE);
2428 uschar *generated_sender_address;
2429
2430 if (submission_mode)
2431 {
2432 if (submission_domain == NULL)
2433 {
2434 generated_sender_address = string_sprintf("%s@%s",
2435 local_part_quote(authenticated_id), qualify_domain_sender);
2436 }
2437 else if (submission_domain[0] == 0) /* empty => full address */
2438 {
2439 generated_sender_address = string_sprintf("%s",
2440 authenticated_id);
2441 }
2442 else
2443 {
2444 generated_sender_address = string_sprintf("%s@%s",
2445 local_part_quote(authenticated_id), submission_domain);
2446 }
2447 }
2448 else
2449 generated_sender_address = string_sprintf("%s@%s",
2450 local_part_quote(originator_login), qualify_domain_sender);
2451
2452 /* Remove permitted prefixes and suffixes from the local part of the From:
2453 address before doing the comparison with the generated sender. */
2454
2455 if (from_address != NULL)
2456 {
2457 int slen;
2458 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2459
2460 if (at != NULL) *at = 0;
2461 from_address += route_check_prefix(from_address, local_from_prefix);
2462 slen = route_check_suffix(from_address, local_from_suffix);
2463 if (slen > 0)
2464 {
2465 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2466 from_address += slen;
2467 }
2468 if (at != NULL) *at = '@';
2469
2470 if (strcmpic(generated_sender_address, from_address) == 0 ||
2471 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2472 make_sender = FALSE;
2473 }
2474
2475 /* We have to cause the Sender header to be rewritten if there are
2476 appropriate rewriting rules. */
2477
2478 if (make_sender)
2479 {
2fe1a124 2480 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2481 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2482 generated_sender_address);
2483 else
2484 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2485 resent_prefix,
2486 submission_mode? submission_name : originator_name,
2487 generated_sender_address);
059ec3d9 2488 }
87ba3f5f
PH
2489
2490 /* Ensure that a non-null envelope sender address corresponds to the
2491 submission mode sender address. */
2492
2493 if (submission_mode && sender_address[0] != 0)
2494 {
2495 if (sender_address_unrewritten == NULL)
2496 sender_address_unrewritten = sender_address;
2497 sender_address = generated_sender_address;
2498 log_write(L_address_rewrite, LOG_MAIN,
2499 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2500 sender_address_unrewritten, generated_sender_address);
2501 }
059ec3d9
PH
2502 }
2503
2504
2505/* If there are any rewriting rules, apply them to the sender address, unless
2506it has already been rewritten as part of verification for SMTP input. */
2507
2508if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2509 sender_address[0] != 0)
2510 {
2511 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2512 global_rewrite_rules, rewrite_existflags);
2513 DEBUG(D_receive|D_rewrite)
2514 debug_printf("rewritten sender = %s\n", sender_address);
2515 }
2516
2517
2518/* The headers must be run through rewrite_header(), because it ensures that
2519addresses are fully qualified, as well as applying any rewriting rules that may
2520exist.
2521
2522Qualification of header addresses in a message from a remote host happens only
2523if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2524appropriate. For local messages, qualification always happens, unless -bnq is
2525used to explicitly suppress it. No rewriting is done for an unqualified address
2526that is left untouched.
2527
2528We start at the second header, skipping our own Received:. This rewriting is
2529documented as happening *after* recipient addresses are taken from the headers
2530by the -t command line option. An added Sender: gets rewritten here. */
2531
2532for (h = header_list->next; h != NULL; h = h->next)
2533 {
2534 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2535 rewrite_existflags, TRUE);
2536 if (newh != NULL) h = newh;
2537 }
2538
2539
2540/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2541"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2542"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2543exists, this applies to the set of resent- headers rather than the normal set.
2544
2cbb4081
PH
2545The requirement for a recipient header has been removed in RFC 2822. At this
2546point in the code, earlier versions of Exim added a To: header for locally
2547submitted messages, and an empty Bcc: header for others. In the light of the
2548changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2549
059ec3d9
PH
2550
2551/* If there is no date header, generate one if the message originates locally
8800895a
PH
2552(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2553submission mode flag is set. Messages without Date: are not valid, but it seems
2554to be more confusing if Exim adds one to all remotely-originated messages. */
059ec3d9 2555
8800895a
PH
2556if (!date_header_exists &&
2557 ((sender_host_address == NULL && !suppress_local_fixups)
2558 || submission_mode))
059ec3d9
PH
2559 header_add(htype_other, "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
2560
2561search_tidyup(); /* Free any cached resources */
2562
2563/* Show the complete set of headers if debugging. Note that the first one (the
2564new Received:) has not yet been set. */
2565
2566DEBUG(D_receive)
2567 {
2568 debug_printf(">>Headers after rewriting and local additions:\n");
2569 for (h = header_list->next; h != NULL; h = h->next)
2570 debug_printf("%c %s", h->type, h->text);
2571 debug_printf("\n");
2572 }
2573
2574/* The headers are now complete in store. If we are running in filter
2575testing mode, that is all this function does. Return TRUE if the message
2576ended with a dot. */
2577
f05da2e8 2578if (filter_test != FTEST_NONE)
059ec3d9
PH
2579 {
2580 process_info[process_info_len] = 0;
2581 return message_ended == END_DOT;
2582 }
2583
2584/* Open a new spool file for the data portion of the message. We need
2585to access it both via a file descriptor and a stream. Try to make the
2586directory if it isn't there. Note re use of sprintf: spool_directory
2587is checked on input to be < 200 characters long. */
2588
2589sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir,
2590 message_id);
2591data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2592if (data_fd < 0)
2593 {
2594 if (errno == ENOENT)
2595 {
2596 uschar temp[16];
2597 sprintf(CS temp, "input/%s", message_subdir);
2598 if (message_subdir[0] == 0) temp[5] = 0;
2599 (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE);
2600 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2601 }
2602 if (data_fd < 0)
2603 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2604 spool_name, strerror(errno));
2605 }
2606
2607/* Make sure the file's group is the Exim gid, and double-check the mode
2608because the group setting doesn't always get set automatically. */
2609
ff790e47
PH
2610(void)fchown(data_fd, exim_uid, exim_gid);
2611(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2612
2613/* We now have data file open. Build a stream for it and lock it. We lock only
2614the first line of the file (containing the message ID) because otherwise there
2615are problems when Exim is run under Cygwin (I'm told). See comments in
2616spool_in.c, where the same locking is done. */
2617
2618data_file = fdopen(data_fd, "w+");
2619lock_data.l_type = F_WRLCK;
2620lock_data.l_whence = SEEK_SET;
2621lock_data.l_start = 0;
2622lock_data.l_len = SPOOL_DATA_START_OFFSET;
2623
2624if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2625 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2626 errno, strerror(errno));
2627
2628/* We have an open, locked data file. Write the message id to it to make it
2629self-identifying. Then read the remainder of the input of this message and
2630write it to the data file. If the variable next != NULL, it contains the first
2631data line (which was read as a header but then turned out not to have the right
2632format); write it (remembering that it might contain binary zeros). The result
2633of fwrite() isn't inspected; instead we call ferror() below. */
2634
2635fprintf(data_file, "%s-D\n", message_id);
2636if (next != NULL)
2637 {
2638 uschar *s = next->text;
2639 int len = next->slen;
f1e894f3 2640 (void)fwrite(s, 1, len, data_file);
059ec3d9
PH
2641 body_linecount++; /* Assumes only 1 line */
2642 }
2643
2644/* Note that we might already be at end of file, or the logical end of file
2645(indicated by '.'), or might have encountered an error while writing the
2646message id or "next" line. */
2647
2648if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2649 {
2650 if (smtp_input)
2651 {
2652 message_ended = read_message_data_smtp(data_file);
2653 receive_linecount++; /* The terminating "." line */
2654 }
2655 else message_ended = read_message_data(data_file);
2656
2657 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 2658 message_linecount += body_linecount;
059ec3d9
PH
2659
2660 /* Handle premature termination of SMTP */
2661
2662 if (smtp_input && message_ended == END_EOF)
2663 {
2664 Uunlink(spool_name); /* Lose data file when closed */
2665 message_id[0] = 0; /* Indicate no message accepted */
2666 smtp_reply = handle_lost_connection(US"");
2667 smtp_yield = FALSE;
2668 goto TIDYUP; /* Skip to end of function */
2669 }
2670
2671 /* Handle message that is too big. Don't use host_or_ident() in the log
2672 message; we want to see the ident value even for non-remote messages. */
2673
2674 if (message_ended == END_SIZE)
2675 {
2676 Uunlink(spool_name); /* Lose the data file when closed */
2677 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2678
2679 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2680 "message too big: read=%d max=%d",
2681 sender_address,
2682 (sender_fullhost == NULL)? "" : " H=",
2683 (sender_fullhost == NULL)? US"" : sender_fullhost,
2684 (sender_ident == NULL)? "" : " U=",
2685 (sender_ident == NULL)? US"" : sender_ident,
2686 message_size,
2687 thismessage_size_limit);
2688
2689 if (smtp_input)
2690 {
2691 smtp_reply = US"552 Message size exceeds maximum permitted";
2692 message_id[0] = 0; /* Indicate no message accepted */
2693 goto TIDYUP; /* Skip to end of function */
2694 }
2695 else
2696 {
2697 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2698 give_local_error(ERRMESS_TOOBIG,
2699 string_sprintf("message too big (max=%d)", thismessage_size_limit),
2700 US"message rejected: ", error_rc, data_file, header_list);
2701 /* Does not return */
2702 }
2703 }
2704 }
2705
2706/* Restore the standard SIGALRM handler for any subsequent processing. (For
2707example, there may be some expansion in an ACL that uses a timer.) */
2708
2709os_non_restarting_signal(SIGALRM, sigalrm_handler);
2710
2711/* The message body has now been read into the data file. Call fflush() to
2712empty the buffers in C, and then call fsync() to get the data written out onto
2713the disk, as fflush() doesn't do this (or at least, it isn't documented as
2714having to do this). If there was an I/O error on either input or output,
2715attempt to send an error message, and unlink the spool file. For non-SMTP input
2716we can then give up. Note that for SMTP input we must swallow the remainder of
2717the input in cases of output errors, since the far end doesn't expect to see
2718anything until the terminating dot line is sent. */
2719
2720if (fflush(data_file) == EOF || ferror(data_file) ||
2721 fsync(fileno(data_file)) < 0 || (receive_ferror)())
2722 {
2723 uschar *msg_errno = US strerror(errno);
2724 BOOL input_error = (receive_ferror)() != 0;
2725 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
2726 input_error? "Input read" : "Spool write",
2727 msg_errno,
2728 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
2729
2730 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
2731 Uunlink(spool_name); /* Lose the data file */
2732
2733 if (smtp_input)
2734 {
2735 if (input_error)
2736 smtp_reply = US"451 Error while reading input data";
2737 else
2738 {
2739 smtp_reply = US"451 Error while writing spool file";
2740 receive_swallow_smtp();
2741 }
2742 message_id[0] = 0; /* Indicate no message accepted */
2743 goto TIDYUP; /* Skip to end of function */
2744 }
2745
2746 else
2747 {
2748 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2749 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
2750 header_list);
2751 /* Does not return */
2752 }
2753 }
2754
2755
2756/* No I/O errors were encountered while writing the data file. */
2757
2758DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
2759
2760
2761/* If there were any bad addresses extracted by -t, or there were no recipients
2762left after -t, send a message to the sender of this message, or write it to
2763stderr if the error handling option is set that way. Note that there may
2764legitimately be no recipients for an SMTP message if they have all been removed
2765by "discard".
2766
2767We need to rewind the data file in order to read it. In the case of no
2768recipients or stderr error writing, throw the data file away afterwards, and
2769exit. (This can't be SMTP, which always ensures there's at least one
2770syntactically good recipient address.) */
2771
2772if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
2773 {
2774 DEBUG(D_receive)
2775 {
2776 if (recipients_count == 0) debug_printf("*** No recipients\n");
2777 if (bad_addresses != NULL)
2778 {
2779 error_block *eblock = bad_addresses;
2780 debug_printf("*** Bad address(es)\n");
2781 while (eblock != NULL)
2782 {
2783 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
2784 eblock = eblock->next;
2785 }
2786 }
2787 }
2788
2789 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2790
2791 /* If configured to send errors to the sender, but this fails, force
2792 a failure error code. We use a special one for no recipients so that it
2793 can be detected by the autoreply transport. Otherwise error_rc is set to
2794 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
2795 it is EXIT_SUCCESS. */
2796
2797 if (error_handling == ERRORS_SENDER)
2798 {
2799 if (!moan_to_sender(
2800 (bad_addresses == NULL)?
2801 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
2802 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
2803 bad_addresses, header_list, data_file, FALSE))
2804 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
2805 }
2806 else
2807 {
2808 if (bad_addresses == NULL)
2809 {
2810 if (extracted_ignored)
2811 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
2812 else
2813 fprintf(stderr, "exim: no recipients in message\n");
2814 }
2815 else
2816 {
2817 fprintf(stderr, "exim: invalid address%s",
2818 (bad_addresses->next == NULL)? ":" : "es:\n");
2819 while (bad_addresses != NULL)
2820 {
2821 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
2822 bad_addresses->text2);
2823 bad_addresses = bad_addresses->next;
2824 }
2825 }
2826 }
2827
2828 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
2829 {
2830 Uunlink(spool_name);
f1e894f3 2831 (void)fclose(data_file);
059ec3d9
PH
2832 exim_exit(error_rc);
2833 }
2834 }
2835
2836/* Data file successfully written. Generate text for the Received: header by
2837expanding the configured string, and adding a timestamp. By leaving this
2838operation till now, we ensure that the timestamp is the time that message
2839reception was completed. However, this is deliberately done before calling the
2840data ACL and local_scan().
2841
2842This Received: header may therefore be inspected by the data ACL and by code in
2843the local_scan() function. When they have run, we update the timestamp to be
2844the final time of reception.
2845
2846If there is just one recipient, set up its value in the $received_for variable
2847for use when we generate the Received: header.
2848
2849Note: the checking for too many Received: headers is handled by the delivery
2850code. */
2851
2852timestamp = expand_string(US"${tod_full}");
2853if (recipients_count == 1) received_for = recipients_list[0].address;
2854received = expand_string(received_header_text);
2855received_for = NULL;
2856
2857if (received == NULL)
2858 {
2859 Uunlink(spool_name); /* Lose the data file */
2860 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
2861 "(received_header_text) failed: %s", string_printing(received_header_text),
2862 expand_string_message);
2863 }
2864
2865/* The first element on the header chain is reserved for the Received header,
2866so all we have to do is fill in the text pointer, and set the type. However, if
2867the result of the expansion is an empty string, we leave the header marked as
2868"old" so as to refrain from adding a Received header. */
2869
2870if (received[0] == 0)
2871 {
2872 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
2873 received_header->type = htype_old;
2874 }
2875else
2876 {
2877 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
2878 received_header->type = htype_received;
2879 }
2880
2881received_header->slen = Ustrlen(received_header->text);
2882
2883DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
2884 received_header->type, received_header->text);
2885
2886/* Set the value of message_body_size for the DATA ACL and for local_scan() */
2887
2888message_body_size = (fstat(data_fd, &statbuf) == 0)?
2889 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
2890
2891/* If an ACL from any RCPT commands set up any warning headers to add, do so
2892now, before running the DATA ACL. */
2893
2894add_acl_headers(US"MAIL or RCPT");
2895
2896/* If an ACL is specified for checking things at this stage of reception of a
2897message, run it, unless all the recipients were removed by "discard" in earlier
2898ACLs. That is the only case in which recipients_count can be zero at this
2899stage. Set deliver_datafile to point to the data file so that $message_body and
2900$message_body_end can be extracted if needed. Allow $recipients in expansions.
2901*/
2902
2903deliver_datafile = data_fd;
2904
2905if (recipients_count == 0)
2906 {
2907 blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL";
2908 }
2909else
2910 {
2911 enable_dollar_recipients = TRUE;
2912
2913 /* Handle interactive SMTP messages */
2914
2915 if (smtp_input && !smtp_batched_input)
2916 {
8523533c 2917
fb2274d4
TK
2918#ifdef EXPERIMENTAL_DOMAINKEYS
2919 dk_exim_verify_finish();
2920#endif
2921
8523533c 2922#ifdef WITH_CONTENT_SCAN
54cdb463
PH
2923 if (acl_smtp_mime != NULL &&
2924 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
2925 goto TIDYUP;
8523533c
TK
2926#endif /* WITH_CONTENT_SCAN */
2927
54cdb463
PH
2928 /* Check the recipients count again, as the MIME ACL might have changed
2929 them. */
8523533c 2930
059ec3d9
PH
2931 if (acl_smtp_data != NULL && recipients_count > 0)
2932 {
2933 uschar *user_msg, *log_msg;
2934 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
2935 add_acl_headers(US"DATA");
2936 if (rc == DISCARD)
2937 {
2938 recipients_count = 0;
2939 blackholed_by = US"DATA ACL";
8e669ac1
PH
2940 if (log_msg != NULL)
2941 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9
PH
2942 }
2943 else if (rc != OK)
2944 {
2945 Uunlink(spool_name);
8523533c
TK
2946#ifdef WITH_CONTENT_SCAN
2947 unspool_mbox();
2948#endif
059ec3d9
PH
2949 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
2950 smtp_yield = FALSE; /* No more messsages after dropped connection */
2951 smtp_reply = US""; /* Indicate reply already sent */
2952 message_id[0] = 0; /* Indicate no message accepted */
2953 goto TIDYUP; /* Skip to end of function */
2954 }
2955 }
2956 }
2957
2958 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
2959 we cannot take different actions for permanent and temporary rejections. */
2960
54cdb463 2961 else
059ec3d9 2962 {
54cdb463
PH
2963
2964#ifdef WITH_CONTENT_SCAN
2965 if (acl_not_smtp_mime != NULL &&
2966 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
2967 &blackholed_by))
2968 goto TIDYUP;
2969#endif /* WITH_CONTENT_SCAN */
2970
2971 if (acl_not_smtp != NULL)
059ec3d9 2972 {
54cdb463
PH
2973 uschar *user_msg, *log_msg;
2974 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
2975 if (rc == DISCARD)
059ec3d9 2976 {
54cdb463
PH
2977 recipients_count = 0;
2978 blackholed_by = US"non-SMTP ACL";
2979 if (log_msg != NULL)
2980 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 2981 }
54cdb463 2982 else if (rc != OK)
059ec3d9 2983 {
54cdb463
PH
2984 Uunlink(spool_name);
2985#ifdef WITH_CONTENT_SCAN
2986 unspool_mbox();
2987#endif
2988 log_write(0, LOG_MAIN|LOG_REJECT, "F=<%s> rejected by non-SMTP ACL: %s",
2989 sender_address, log_msg);
2990 if (user_msg == NULL) user_msg = US"local configuration problem";
2991 if (smtp_batched_input)
2992 {
2993 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
2994 /* Does not return */
2995 }
2996 else
2997 {
2998 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2999 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3000 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3001 header_list);
3002 /* Does not return */
3003 }
059ec3d9 3004 }
54cdb463 3005 add_acl_headers(US"non-SMTP");
059ec3d9 3006 }
059ec3d9
PH
3007 }
3008
54cdb463
PH
3009 /* The applicable ACLs have been run */
3010
059ec3d9
PH
3011 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3012 if (queue_only_policy) queued_by = US"ACL";
3013
3014 enable_dollar_recipients = FALSE;
3015 }
3016
8523533c
TK
3017#ifdef WITH_CONTENT_SCAN
3018unspool_mbox();
3019#endif
3020
059ec3d9
PH
3021/* The final check on the message is to run the scan_local() function. The
3022version supplied with Exim always accepts, but this is a hook for sysadmins to
3023supply their own checking code. The local_scan() function is run even when all
3024the recipients have been discarded. */
3025
3026lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3027
3028/* Arrange to catch crashes in local_scan(), so that the -D file gets
3029deleted, and the incident gets logged. */
3030
3031os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3032os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3033os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3034os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3035
3036DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3037 local_scan_timeout);
3038local_scan_data = NULL;
3039
3040os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3041if (local_scan_timeout > 0) alarm(local_scan_timeout);
3042rc = local_scan(data_fd, &local_scan_data);
3043alarm(0);
3044os_non_restarting_signal(SIGALRM, sigalrm_handler);
3045
3046store_pool = POOL_MAIN; /* In case changed */
3047DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3048 local_scan_data);
3049
3050os_non_restarting_signal(SIGSEGV, SIG_DFL);
3051os_non_restarting_signal(SIGFPE, SIG_DFL);
3052os_non_restarting_signal(SIGILL, SIG_DFL);
3053os_non_restarting_signal(SIGBUS, SIG_DFL);
3054
3055/* The length check is paranoia against some runaway code, and also because
3056(for a success return) lines in the spool file are read into big_buffer. */
3057
3058if (local_scan_data != NULL)
3059 {
3060 int len = Ustrlen(local_scan_data);
3061 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3062 local_scan_data = string_copyn(local_scan_data, len);
3063 }
3064
3065if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3066 {
3067 if (!deliver_freeze) /* ACL might have already frozen */
3068 {
3069 deliver_freeze = TRUE;
3070 deliver_frozen_at = time(NULL);
3071 frozen_by = US"local_scan()";
3072 }
3073 rc = LOCAL_SCAN_ACCEPT;
3074 }
3075else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3076 {
3077 if (!queue_only_policy) /* ACL might have already queued */
3078 {
3079 queue_only_policy = TRUE;
3080 queued_by = US"local_scan()";
3081 }
3082 rc = LOCAL_SCAN_ACCEPT;
3083 }
3084
3085/* Message accepted: remove newlines in local_scan_data because otherwise
3086the spool file gets corrupted. Ensure that all recipients are qualified. */
3087
3088if (rc == LOCAL_SCAN_ACCEPT)
3089 {
3090 if (local_scan_data != NULL)
3091 {
3092 uschar *s;
3093 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3094 }
3095 for (i = 0; i < recipients_count; i++)
3096 {
3097 recipient_item *r = recipients_list + i;
3098 r->address = rewrite_address_qualify(r->address, TRUE);
3099 if (r->errors_to != NULL)
3100 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3101 }
3102 if (recipients_count == 0 && blackholed_by == NULL)
3103 blackholed_by = US"local_scan";
3104 }
3105
3106/* Message rejected: newlines permitted in local_scan_data to generate
3107multiline SMTP responses. */
3108
3109else
3110 {
3111 uschar *istemp = US"";
3112 uschar *s = NULL;
3113 int size = 0;
3114 int sptr = 0;
3115 int code;
3116
3117 errmsg = local_scan_data;
3118
3119 Uunlink(spool_name); /* Cancel this message */
3120 switch(rc)
3121 {
3122 default:
3123 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3124 "rejection given", rc);
3125 goto TEMPREJECT;
3126
3127 case LOCAL_SCAN_REJECT_NOLOGHDR:
3128 log_extra_selector &= ~LX_rejected_header;
3129 /* Fall through */
3130
3131 case LOCAL_SCAN_REJECT:
3132 code = 550;
3133 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3134 break;
3135
3136 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
3137 log_extra_selector &= ~LX_rejected_header;
3138 /* Fall through */
3139
3140 case LOCAL_SCAN_TEMPREJECT:
3141 TEMPREJECT:
3142 code = 451;
3143 if (errmsg == NULL) errmsg = US"Temporary local problem";
3144 istemp = US"temporarily ";
3145 break;
3146 }
3147
3148 s = string_append(s, &size, &sptr, 2, US"F=",
3149 (sender_address[0] == 0)? US"<>" : sender_address);
3150 s = add_host_info_for_log(s, &size, &sptr);
3151 s[sptr] = 0;
3152
3153 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3154 s, istemp, string_printing(errmsg));
3155
3156 if (smtp_input)
3157 {
3158 if (!smtp_batched_input)
3159 {
3160 smtp_respond(code, TRUE, errmsg);
3161 message_id[0] = 0; /* Indicate no message accepted */
3162 smtp_reply = US""; /* Indicate reply already sent */
3163 goto TIDYUP; /* Skip to end of function */
3164 }
3165 else
3166 {
3167 moan_smtp_batch(NULL, "%d %s", code, errmsg);
3168 /* Does not return */
3169 }
3170 }
3171 else
3172 {
3173 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3174 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3175 US"message rejected by local scan code: ", error_rc, data_file,
3176 header_list);
3177 /* Does not return */
3178 }
3179 }
3180
3181/* Reset signal handlers to ignore signals that previously would have caused
3182the message to be abandoned. */
3183
3184signal(SIGTERM, SIG_IGN);
3185signal(SIGINT, SIG_IGN);
3186
3187/* Ensure the first time flag is set in the newly-received message. */
3188
3189deliver_firsttime = TRUE;
3190
8523533c
TK
3191#ifdef EXPERIMENTAL_BRIGHTMAIL
3192if (bmi_run == 1) {
3193 /* rewind data file */
3194 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3195 bmi_verdicts = bmi_process_message(header_list, data_fd);
3196};
3197#endif
3198
059ec3d9
PH
3199/* Update the timstamp in our Received: header to account for any time taken by
3200an ACL or by local_scan(). The new time is the time that all reception
3201processing is complete. */
3202
3203timestamp = expand_string(US"${tod_full}");
3204tslen = Ustrlen(timestamp);
3205
3206memcpy(received_header->text + received_header->slen - tslen - 1,
3207 timestamp, tslen);
3208
3209/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3210
3211if (mua_wrapper)
3212 {
3213 deliver_freeze = FALSE;
3214 queue_only_policy = FALSE;
3215 }
3216
3217/* Keep the data file open until we have written the header file, in order to
3218hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3219don't write the header file, and we unlink the data file. If writing the header
3220file fails, we have failed to accept this message. */
3221
3222if (host_checking || blackholed_by != NULL)
3223 {
3224 header_line *h;
3225 Uunlink(spool_name);
3226 msg_size = 0; /* Compute size for log line */
3227 for (h = header_list; h != NULL; h = h->next)
3228 if (h->type != '*') msg_size += h->slen;
3229 }
3230
3231/* Write the -H file */
3232
3233else
3234 {
3235 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3236 {
3237 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3238 Uunlink(spool_name); /* Lose the data file */
3239
3240 if (smtp_input)
3241 {
3242 smtp_reply = US"451 Error in writing spool file";
3243 message_id[0] = 0; /* Indicate no message accepted */
3244 goto TIDYUP;
3245 }
3246 else
3247 {
3248 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3249 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3250 header_list);
3251 /* Does not return */
3252 }
3253 }
3254 }
3255
3256
3257/* The message has now been successfully received. */
3258
3259receive_messagecount++;
3260
3261/* In SMTP sessions we may receive several in one connection. After each one,
3262we wait for the clock to tick at the level of message-id granularity. This is
3263so that the combination of time+pid is unique, even on systems where the pid
3264can be re-used within our time interval. We can't shorten the interval without
3265re-designing the message-id. See comments above where the message id is
3266created. This is Something For The Future. */
3267
3268message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3269exim_wait_tick(&message_id_tv, id_resolution);
3270
3271/* Add data size to written header size. We do not count the initial file name
3272that is in the file, but we do add one extra for the notional blank line that
3273precedes the data. This total differs from message_size in that it include the
3274added Received: header and any other headers that got created locally. */
3275
3276fflush(data_file);
3277fstat(data_fd, &statbuf);
3278
3279msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3280
3281/* Generate a "message received" log entry. We do this by building up a dynamic
3282string as required. Since we commonly want to add two items at a time, use a
3283macro to simplify the coding. We log the arrival of a new message while the
3284file is still locked, just in case the machine is *really* fast, and delivers
3285it first! Include any message id that is in the message - since the syntax of a
3286message id is actually an addr-spec, we can use the parse routine to canonicize
3287it. */
3288
3289size = 256;
3290sptr = 0;
3291s = store_get(size);
3292
3293s = string_append(s, &size, &sptr, 2, US"<= ",
3294 (sender_address[0] == 0)? US"<>" : sender_address);
3295if (message_reference != NULL)
3296 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3297
3298s = add_host_info_for_log(s, &size, &sptr);
3299
3300#ifdef SUPPORT_TLS
3301if ((log_extra_selector & LX_tls_cipher) != 0 && tls_cipher != NULL)
3302 s = string_append(s, &size, &sptr, 2, US" X=", tls_cipher);
3303if ((log_extra_selector & LX_tls_certificate_verified) != 0 &&
3304 tls_cipher != NULL)
3305 s = string_append(s, &size, &sptr, 2, US" CV=",
3306 tls_certificate_verified? "yes":"no");
3307if ((log_extra_selector & LX_tls_peerdn) != 0 && tls_peerdn != NULL)
3308 s = string_append(s, &size, &sptr, 3, US" DN=\"", tls_peerdn, US"\"");
3309#endif
3310
3311if (sender_host_authenticated != NULL)
3312 {
3313 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
3314 if (authenticated_id != NULL)
3315 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
3316 }
3317
3318sprintf(CS big_buffer, "%d", msg_size);
3319s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3320
3321/* If an addr-spec in a message-id contains a quoted string, it can contain
3322any characters except " \ and CR and so in particular it can contain NL!
3323Therefore, make sure we use a printing-characters only version for the log.
3324Also, allow for domain literals in the message id. */
3325
3326if (msgid_header != NULL)
3327 {
3328 uschar *old_id;
3329 BOOL save_allow_domain_literals = allow_domain_literals;
3330 allow_domain_literals = TRUE;
3331 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3332 &errmsg, &start, &end, &domain, FALSE);
3333 allow_domain_literals = save_allow_domain_literals;
3334 if (old_id != NULL)
3335 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3336 }
3337
3338/* If subject logging is turned on, create suitable printing-character
3339text. By expanding $h_subject: we make use of the MIME decoding. */
3340
3341if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL)
3342 {
3343 int i;
3344 uschar *p = big_buffer;
3345 uschar *ss = expand_string(US"$h_subject:");
3346
3347 /* Backslash-quote any double quotes or backslashes so as to make a
3348 a C-like string, and turn any non-printers into escape sequences. */
3349
3350 *p++ = '\"';
3351 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3352 {
3353 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3354 *p++ = ss[i];
3355 }
3356 *p++ = '\"';
3357 *p = 0;
3358 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3359 }
3360
3361/* Terminate the string: string_cat() and string_append() leave room, but do
3362not put the zero in. */
3363
3364s[sptr] = 0;
3365
3366/* While writing to the log, set a flag to cause a call to receive_bomb_out()
3367if the log cannot be opened. */
3368
3369receive_call_bombout = TRUE;
3370log_write(0, LOG_MAIN |
3371 (((log_extra_selector & LX_received_recipients) != 0)? LOG_RECIPIENTS : 0) |
3372 (((log_extra_selector & LX_received_sender) != 0)? LOG_SENDER : 0),
3373 "%s", s);
3374receive_call_bombout = FALSE;
3375
3376/* Log any control actions taken by an ACL or local_scan(). */
3377
3378if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
3379if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
3380 "no immediate delivery: queued by %s", queued_by);
3381
3382/* Create a message log file if message logs are being used and this message is
3383not blackholed. Write the reception stuff to it. We used to leave message log
3384creation until the first delivery, but this has proved confusing for somep
3385people. */
3386
3387if (message_logs && blackholed_by == NULL)
3388 {
3389 int fd;
3390
3391 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir,
3392 message_id);
3393 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3394
3395 if (fd < 0 && errno == ENOENT)
3396 {
3397 uschar temp[16];
3398 sprintf(CS temp, "msglog/%s", message_subdir);
3399 if (message_subdir[0] == 0) temp[6] = 0;
3400 (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE);
3401 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3402 }
3403
3404 if (fd < 0)
3405 {
3406 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3407 spool_name, strerror(errno));
3408 }
3409
3410 else
3411 {
3412 FILE *message_log = fdopen(fd, "a");
3413 if (message_log == NULL)
3414 {
3415 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3416 spool_name, strerror(errno));
f1e894f3 3417 (void)close(fd);
059ec3d9
PH
3418 }
3419 else
3420 {
3421 uschar *now = tod_stamp(tod_log);
3422 fprintf(message_log, "%s Received from %s\n", now, s+3);
3423 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3424 frozen_by);
3425 if (queue_only_policy) fprintf(message_log,
3426 "%s no immediate delivery: queued by %s\n", now, queued_by);
f1e894f3 3427 (void)fclose(message_log);
059ec3d9
PH
3428 }
3429 }
3430 }
3431
3432store_reset(s); /* The store for the main log message can be reused */
3433
3434/* If the message is frozen, and freeze_tell is set, do the telling. */
3435
3436if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
3437 {
3438 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
3439 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
3440 message_id, frozen_by, sender_address);
3441 }
3442
3443
3444/* Either a message has been successfully received and written to the two spool
3445files, or an error in writing the spool has occurred for an SMTP message, or
3446an SMTP message has been rejected because of a bad sender. (For a non-SMTP
3447message we will have already given up because there's no point in carrying on!)
3448In either event, we must now close (and thereby unlock) the data file. In the
3449successful case, this leaves the message on the spool, ready for delivery. In
3450the error case, the spool file will be deleted. Then tidy up store, interact
3451with an SMTP call if necessary, and return.
3452
3453A fflush() was done earlier in the expectation that any write errors on the
3454data file will be flushed(!) out thereby. Nevertheless, it is theoretically
3455possible for fclose() to fail - but what to do? What has happened to the lock
3456if this happens? */
3457
3458TIDYUP:
f1e894f3
PH
3459process_info[process_info_len] = 0; /* Remove message id */
3460if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
059ec3d9
PH
3461
3462/* Now reset signal handlers to their defaults */
3463
3464signal(SIGTERM, SIG_DFL);
3465signal(SIGINT, SIG_DFL);
3466
3467/* Tell an SMTP caller the state of play, and arrange to return the SMTP return
3468value, which defaults TRUE - meaning there may be more incoming messages from
3469this connection. For non-SMTP callers (where there is only ever one message),
3470the default is FALSE. */
3471
3472if (smtp_input)
3473 {
3474 yield = smtp_yield;
3475
3476 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
3477 is set to the response. However, after an ACL error or local_scan() error,
3478 the response has already been sent, and smtp_reply is an empty string to
3479 indicate this. */
3480
3481 if (!smtp_batched_input)
3482 {
3483 if (smtp_reply == NULL)
3484 {
29aba418
TF
3485 if (fake_response != OK)
3486 smtp_respond(fake_response == DEFER ? 450 : 550,
3487 TRUE, fake_response_text);
8e669ac1
PH
3488 else
3489 smtp_printf("250 OK id=%s\r\n", message_id);
059ec3d9
PH
3490 if (host_checking)
3491 fprintf(stdout,
3492 "\n**** SMTP testing: that is not a real message id!\n\n");
3493 }
8523533c
TK
3494 else if (smtp_reply[0] != 0)
3495 {
29aba418
TF
3496 if (fake_response != OK && (smtp_reply[0] == '2'))
3497 smtp_respond(fake_response == DEFER ? 450 : 550,
3498 TRUE, fake_response_text);
8e669ac1 3499 else
6951ac6c
PH
3500 smtp_printf("%.1024s\r\n", smtp_reply);
3501 }
059ec3d9
PH
3502 }
3503
3504 /* For batched SMTP, generate an error message on failure, and do
3505 nothing on success. The function moan_smtp_batch() does not return -
3506 it exits from the program with a non-zero return code. */
3507
3508 else if (smtp_reply != NULL) moan_smtp_batch(NULL, "%s", smtp_reply);
3509 }
3510
3511
3512/* If blackholing, we can immediately log this message's sad fate. The data
3513file has already been unlinked, and the header file was never written to disk.
3514We must now indicate that nothing was received, to prevent a delivery from
3515starting. */
3516
3517if (blackholed_by != NULL)
3518 {
3519 uschar *detail = (local_scan_data != NULL)?
3520 string_printing(local_scan_data) :
3521 string_sprintf("(%s discarded recipients)", blackholed_by);
04f7d5b9 3522 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
059ec3d9
PH
3523 log_write(0, LOG_MAIN, "Completed");
3524 message_id[0] = 0;
3525 }
3526
3527/* Reset headers so that logging of rejects for a subsequent message doesn't
3528include them. It is also important to set header_last = NULL before exiting
3529from this function, as this prevents certain rewrites that might happen during
3530subsequent verifying (of another incoming message) from trying to add headers
3531when they shouldn't. */
3532
3533header_list = header_last = NULL;
3534
3535return yield; /* TRUE if more messages (SMTP only) */
3536}
3537
3538/* End of receive.c */