CHUNKING/DKIM: fix handling of lines having a leading dot
[exim.git] / src / src / receive.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
80fea873 5/* Copyright (c) University of Cambridge 1995 - 2016 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Code for receiving a message and setting up spool files. */
9
059ec3d9
PH
10#include "exim.h"
11
6a8f9482
TK
12#ifdef EXPERIMENTAL_DCC
13extern int dcc_ok;
14#endif
15
4840604e 16#ifdef EXPERIMENTAL_DMARC
c007c974 17# include "dmarc.h"
4840604e
TL
18#endif /* EXPERIMENTAL_DMARC */
19
059ec3d9
PH
20/*************************************************
21* Local static variables *
22*************************************************/
23
24static FILE *data_file = NULL;
25static int data_fd = -1;
41313d92 26static uschar *spool_name = US"";
059ec3d9
PH
27
28
29
30/*************************************************
31* Non-SMTP character reading functions *
32*************************************************/
33
34/* These are the default functions that are set up in the variables such as
35receive_getc initially. They just call the standard functions, passing stdin as
36the file. (When SMTP input is occurring, different functions are used by
37changing the pointer variables.) */
38
39int
40stdin_getc(void)
41{
42return getc(stdin);
43}
44
45int
46stdin_ungetc(int c)
47{
48return ungetc(c, stdin);
49}
50
51int
52stdin_feof(void)
53{
54return feof(stdin);
55}
56
57int
58stdin_ferror(void)
59{
60return ferror(stdin);
61}
62
63
64
65
66/*************************************************
67* Check that a set sender is allowed *
68*************************************************/
69
70/* This function is called when a local caller sets an explicit sender address.
71It checks whether this is permitted, which it is for trusted callers.
72Otherwise, it must match the pattern(s) in untrusted_set_sender.
73
74Arguments: the proposed sender address
75Returns: TRUE for a trusted caller
76 TRUE if the address has been set, untrusted_set_sender has been
77 set, and the address matches something in the list
78 FALSE otherwise
79*/
80
81BOOL
82receive_check_set_sender(uschar *newsender)
83{
84uschar *qnewsender;
85if (trusted_caller) return TRUE;
86if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
87qnewsender = (Ustrchr(newsender, '@') != NULL)?
88 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
89return
55414b25 90 match_address_list(qnewsender, TRUE, TRUE, CUSS &untrusted_set_sender, NULL, -1,
059ec3d9
PH
91 0, NULL) == OK;
92}
93
94
95
96
97/*************************************************
5cb8cbc6 98* Read space info for a partition *
059ec3d9
PH
99*************************************************/
100
8e669ac1
PH
101/* This function is called by receive_check_fs() below, and also by string
102expansion for variables such as $spool_space. The field names for the statvfs
5cb8cbc6
PH
103structure are macros, because not all OS have F_FAVAIL and it seems tidier to
104have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
105have inodes, and they return -1 for the number available.
059ec3d9 106
5cb8cbc6
PH
107Later: It turns out that some file systems that do not have the concept of
108inodes return 0 rather than -1. Such systems should also return 0 for the total
8e669ac1 109number of inodes, so we require that to be greater than zero before returning
5cb8cbc6 110an inode count.
059ec3d9 111
5cb8cbc6
PH
112Arguments:
113 isspool TRUE for spool partition, FALSE for log partition
114 inodeptr address of int to receive inode count; -1 if there isn't one
8e669ac1 115
5cb8cbc6 116Returns: available on-root space, in kilobytes
8e669ac1
PH
117 -1 for log partition if there isn't one
118
119All values are -1 if the STATFS functions are not available.
059ec3d9
PH
120*/
121
8e669ac1 122int
5cb8cbc6 123receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
124{
125#ifdef HAVE_STATFS
059ec3d9 126struct STATVFS statbuf;
5cb8cbc6
PH
127uschar *path;
128uschar *name;
129uschar buffer[1024];
059ec3d9 130
5cb8cbc6 131/* The spool directory must always exist. */
059ec3d9 132
5cb8cbc6 133if (isspool)
059ec3d9 134 {
8e669ac1
PH
135 path = spool_directory;
136 name = US"spool";
137 }
138
059ec3d9
PH
139/* Need to cut down the log file path to the directory, and to ignore any
140appearance of "syslog" in it. */
141
5cb8cbc6 142else
059ec3d9 143 {
059ec3d9 144 int sep = ':'; /* Not variable - outside scripts use */
55414b25 145 const uschar *p = log_file_path;
8e669ac1 146 name = US"log";
059ec3d9
PH
147
148 /* An empty log_file_path means "use the default". This is the same as an
149 empty item in a list. */
150
151 if (*p == 0) p = US":";
55414b25
JH
152 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))))
153 if (Ustrcmp(path, "syslog") != 0)
154 break;
059ec3d9 155
5cb8cbc6
PH
156 if (path == NULL) /* No log files */
157 {
8e669ac1
PH
158 *inodeptr = -1;
159 return -1;
160 }
059ec3d9 161
8e669ac1
PH
162 /* An empty string means use the default, which is in the spool directory.
163 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 164 subdirectory has been symbolically linked elsewhere. */
059ec3d9 165
8e669ac1 166 if (path[0] == 0)
059ec3d9 167 {
5cb8cbc6
PH
168 sprintf(CS buffer, CS"%s/log", CS spool_directory);
169 path = buffer;
8e669ac1
PH
170 }
171 else
059ec3d9 172 {
8e669ac1 173 uschar *cp;
5cb8cbc6 174 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 175 }
5cb8cbc6 176 }
8e669ac1 177
8f128379 178/* We now have the path; do the business */
5cb8cbc6
PH
179
180memset(&statbuf, 0, sizeof(statbuf));
181
182if (STATVFS(CS path, &statbuf) != 0)
183 {
184 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
185 "%s directory %s: %s", name, spool_directory, strerror(errno));
186 smtp_closedown(US"spool or log directory problem");
187 exim_exit(EXIT_FAILURE);
188 }
8e669ac1 189
5cb8cbc6
PH
190*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
191
192/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 193
5cb8cbc6
PH
194return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
195
196/* Unable to find partition sizes in this environment. */
197
198#else
199*inodeptr = -1;
200return -1;
201#endif
202}
203
059ec3d9 204
059ec3d9 205
5cb8cbc6
PH
206
207/*************************************************
208* Check space on spool and log partitions *
209*************************************************/
210
211/* This function is called before accepting a message; if any thresholds are
212set, it checks them. If a message_size is supplied, it checks that there is
213enough space for that size plus the threshold - i.e. that the message won't
214reduce the space to the threshold. Not all OS have statvfs(); for those that
215don't, this function always returns TRUE. For some OS the old function and
216struct name statfs is used; that is handled by a macro, defined in exim.h.
217
218Arguments:
219 msg_size the (estimated) size of an incoming message
220
221Returns: FALSE if there isn't enough space, or if the information cannot
222 be obtained
223 TRUE if no check was done or there is enough space
224*/
225
226BOOL
227receive_check_fs(int msg_size)
228{
229int space, inodes;
230
231if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
232 {
8e669ac1
PH
233 space = receive_statvfs(TRUE, &inodes);
234
059ec3d9 235 DEBUG(D_receive)
5cb8cbc6
PH
236 debug_printf("spool directory space = %dK inodes = %d "
237 "check_space = %dK inodes = %d msg_size = %d\n",
238 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
239
240 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 241 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 242 {
5cb8cbc6
PH
243 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
244 "inodes=%d", space, inodes);
059ec3d9
PH
245 return FALSE;
246 }
247 }
248
5cb8cbc6
PH
249if (check_log_space > 0 || check_log_inodes > 0)
250 {
8e669ac1
PH
251 space = receive_statvfs(FALSE, &inodes);
252
5cb8cbc6
PH
253 DEBUG(D_receive)
254 debug_printf("log directory space = %dK inodes = %d "
255 "check_space = %dK inodes = %d\n",
256 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
257
258 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 259 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 260 {
5cb8cbc6
PH
261 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
262 "inodes=%d", space, inodes);
263 return FALSE;
264 }
8e669ac1
PH
265 }
266
059ec3d9
PH
267return TRUE;
268}
269
270
271
272/*************************************************
273* Bomb out while reading a message *
274*************************************************/
275
276/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
277received, or if there is a timeout. A rarer case might be if the log files are
278screwed up and Exim can't open them to record a message's arrival. Handling
279that case is done by setting a flag to cause the log functions to call this
280function if there is an ultimate disaster. That is why it is globally
281accessible.
282
8f128379
PH
283Arguments:
284 reason text reason to pass to the not-quit ACL
285 msg default SMTP response to give if in an SMTP session
059ec3d9
PH
286Returns: it doesn't
287*/
288
289void
8f128379 290receive_bomb_out(uschar *reason, uschar *msg)
059ec3d9 291{
ead37e6c
PP
292 static BOOL already_bombing_out;
293/* The smtp_notquit_exit() below can call ACLs which can trigger recursive
294timeouts, if someone has something slow in their quit ACL. Since the only
295things we should be doing are to close down cleanly ASAP, on the second
296pass we also close down stuff that might be opened again, before bypassing
297the ACL call and exiting. */
298
059ec3d9
PH
299/* If spool_name is set, it contains the name of the data file that is being
300written. Unlink it before closing so that it cannot be picked up by a delivery
301process. Ensure that any header file is also removed. */
302
ead37e6c 303if (spool_name[0] != '\0')
059ec3d9
PH
304 {
305 Uunlink(spool_name);
306 spool_name[Ustrlen(spool_name) - 1] = 'H';
307 Uunlink(spool_name);
ead37e6c 308 spool_name[0] = '\0';
059ec3d9
PH
309 }
310
311/* Now close the file if it is open, either as a fd or a stream. */
312
ead37e6c
PP
313if (data_file != NULL)
314 {
315 (void)fclose(data_file);
316 data_file = NULL;
317} else if (data_fd >= 0) {
318 (void)close(data_fd);
319 data_fd = -1;
320 }
059ec3d9 321
8f128379
PH
322/* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
323smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
324SMTP response. */
059ec3d9 325
ead37e6c 326if (!already_bombing_out)
059ec3d9 327 {
ead37e6c
PP
328 already_bombing_out = TRUE;
329 if (smtp_input)
330 {
331 if (smtp_batched_input)
332 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
333 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
334 smtp_active_hostname, msg);
335 }
059ec3d9
PH
336 }
337
338/* Exit from the program (non-BSMTP cases) */
339
340exim_exit(EXIT_FAILURE);
341}
342
343
344/*************************************************
345* Data read timeout *
346*************************************************/
347
348/* Handler function for timeouts that occur while reading the data that
349comprises a message.
350
351Argument: the signal number
352Returns: nothing
353*/
354
355static void
356data_timeout_handler(int sig)
357{
358uschar *msg = NULL;
359
360sig = sig; /* Keep picky compilers happy */
361
362if (smtp_input)
363 {
364 msg = US"SMTP incoming data timeout";
365 log_write(L_lost_incoming_connection,
366 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
367 "from %s F=<%s>",
368 (sender_fullhost != NULL)? sender_fullhost : US"local process",
369 sender_address);
059ec3d9
PH
370 }
371else
372 {
373 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
374 log_write(L_lost_incoming_connection,
375 LOG_MAIN, "timed out while reading local message");
376 }
377
8f128379 378receive_bomb_out(US"data-timeout", msg); /* Does not return */
059ec3d9
PH
379}
380
381
382
383/*************************************************
384* local_scan() timeout *
385*************************************************/
386
387/* Handler function for timeouts that occur while running a local_scan()
388function.
389
390Argument: the signal number
391Returns: nothing
392*/
393
394static void
395local_scan_timeout_handler(int sig)
396{
397sig = sig; /* Keep picky compilers happy */
398log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
399 "message temporarily rejected (size %d)", message_size);
8f128379
PH
400/* Does not return */
401receive_bomb_out(US"local-scan-timeout", US"local verification problem");
059ec3d9
PH
402}
403
404
405
406/*************************************************
407* local_scan() crashed *
408*************************************************/
409
410/* Handler function for signals that occur while running a local_scan()
411function.
412
413Argument: the signal number
414Returns: nothing
415*/
416
417static void
418local_scan_crash_handler(int sig)
419{
420log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
421 "signal %d - message temporarily rejected (size %d)", sig, message_size);
8f128379
PH
422/* Does not return */
423receive_bomb_out(US"local-scan-error", US"local verification problem");
059ec3d9
PH
424}
425
426
427/*************************************************
428* SIGTERM or SIGINT received *
429*************************************************/
430
431/* Handler for SIGTERM or SIGINT signals that occur while reading the
432data that comprises a message.
433
434Argument: the signal number
435Returns: nothing
436*/
437
438static void
439data_sigterm_sigint_handler(int sig)
440{
441uschar *msg = NULL;
442
443if (smtp_input)
444 {
445 msg = US"Service not available - SIGTERM or SIGINT received";
446 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
447 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
448 }
449else
450 {
f05da2e8 451 if (filter_test == FTEST_NONE)
059ec3d9
PH
452 {
453 fprintf(stderr, "\nexim: %s received - message abandoned\n",
454 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
455 log_write(0, LOG_MAIN, "%s received while reading local message",
456 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
457 }
458 }
459
8f128379 460receive_bomb_out(US"signal-exit", msg); /* Does not return */
059ec3d9
PH
461}
462
463
464
465/*************************************************
466* Add new recipient to list *
467*************************************************/
468
469/* This function builds a list of recipient addresses in argc/argv
470format.
471
472Arguments:
473 recipient the next address to add to recipients_list
474 pno parent number for fixed aliases; -1 otherwise
475
476Returns: nothing
477*/
478
479void
480receive_add_recipient(uschar *recipient, int pno)
481{
482if (recipients_count >= recipients_list_max)
483 {
484 recipient_item *oldlist = recipients_list;
485 int oldmax = recipients_list_max;
486 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
487 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
488 if (oldlist != NULL)
489 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
490 }
491
492recipients_list[recipients_count].address = recipient;
493recipients_list[recipients_count].pno = pno;
8523533c
TK
494#ifdef EXPERIMENTAL_BRIGHTMAIL
495recipients_list[recipients_count].bmi_optin = bmi_current_optin;
496/* reset optin string pointer for next recipient */
497bmi_current_optin = NULL;
498#endif
6c1c3d1d
WB
499recipients_list[recipients_count].orcpt = NULL;
500recipients_list[recipients_count].dsn_flags = 0;
059ec3d9
PH
501recipients_list[recipients_count++].errors_to = NULL;
502}
503
504
505
506
fd98a5c6
JH
507/*************************************************
508* Send user response message *
509*************************************************/
61147df4 510
fd98a5c6
JH
511/* This function is passed a default response code and a user message. It calls
512smtp_message_code() to check and possibly modify the response code, and then
513calls smtp_respond() to transmit the response. I put this into a function
514just to avoid a lot of repetition.
61147df4
PP
515
516Arguments:
fd98a5c6
JH
517 code the response code
518 user_msg the user message
519
520Returns: nothing
61147df4
PP
521*/
522
8ccd00b1 523#ifndef DISABLE_PRDR
61147df4 524static void
fd98a5c6 525smtp_user_msg(uschar *code, uschar *user_msg)
61147df4 526{
fd98a5c6 527int len = 3;
4f6ae5c3 528smtp_message_code(&code, &len, &user_msg, NULL, TRUE);
fd98a5c6 529smtp_respond(code, len, TRUE, user_msg);
61147df4
PP
530}
531#endif
532
533
534
535
fd98a5c6 536
059ec3d9
PH
537/*************************************************
538* Remove a recipient from the list *
539*************************************************/
540
541/* This function is provided for local_scan() to use.
542
543Argument:
544 recipient address to remove
545
546Returns: TRUE if it did remove something; FALSE otherwise
547*/
548
549BOOL
550receive_remove_recipient(uschar *recipient)
551{
552int count;
553DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
554 recipient);
555for (count = 0; count < recipients_count; count++)
556 {
557 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
558 {
559 if ((--recipients_count - count) > 0)
560 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 561 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
562 return TRUE;
563 }
564 }
565return FALSE;
566}
567
568
569
570
571
572/*************************************************
573* Read data portion of a non-SMTP message *
574*************************************************/
575
576/* This function is called to read the remainder of a message (following the
577header) when the input is not from SMTP - we are receiving a local message on
578a standard input stream. The message is always terminated by EOF, and is also
579terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
580two cases for maximum efficiency.
581
582Ensure that the body ends with a newline. This will naturally be the case when
583the termination is "\n.\n" but may not be otherwise. The RFC defines messages
584as "sequences of lines" - this of course strictly applies only to SMTP, but
585deliveries into BSD-type mailbox files also require it. Exim used to have a
586flag for doing this at delivery time, but as it was always set for all
587transports, I decided to simplify things by putting the check here instead.
588
589There is at least one MUA (dtmail) that sends CRLF via this interface, and
590other programs are known to do this as well. Exim used to have a option for
591dealing with this: in July 2003, after much discussion, the code has been
592changed to default to treat any of LF, CRLF, and bare CR as line terminators.
593
594However, for the case when a dot on a line by itself terminates a message, the
595only recognized terminating sequences before and after the dot are LF and CRLF.
596Otherwise, having read EOL . CR, you don't know whether to read another
597character or not.
598
599Internally, in messages stored in Exim's spool files, LF is used as the line
600terminator. Under the new regime, bare CRs will no longer appear in these
601files.
602
603Arguments:
604 fout a FILE to which to write the message
605
606Returns: One of the END_xxx values indicating why it stopped reading
607*/
608
609static int
610read_message_data(FILE *fout)
611{
612int ch_state;
613register int ch;
d677b2f2 614register int linelength = 0;
059ec3d9
PH
615
616/* Handle the case when only EOF terminates the message */
617
618if (!dot_ends)
619 {
620 register int last_ch = '\n';
621
80a47a2c 622 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
059ec3d9
PH
623 {
624 if (ch == 0) body_zerocount++;
625 if (last_ch == '\r' && ch != '\n')
626 {
d677b2f2
PH
627 if (linelength > max_received_linelength)
628 max_received_linelength = linelength;
629 linelength = 0;
059ec3d9
PH
630 if (fputc('\n', fout) == EOF) return END_WERROR;
631 message_size++;
632 body_linecount++;
633 }
634 if (ch == '\r') continue;
635
636 if (fputc(ch, fout) == EOF) return END_WERROR;
d677b2f2
PH
637 if (ch == '\n')
638 {
639 if (linelength > max_received_linelength)
640 max_received_linelength = linelength;
641 linelength = 0;
642 body_linecount++;
643 }
644 else linelength++;
059ec3d9
PH
645 if (++message_size > thismessage_size_limit) return END_SIZE;
646 }
647
648 if (last_ch != '\n')
649 {
d677b2f2
PH
650 if (linelength > max_received_linelength)
651 max_received_linelength = linelength;
059ec3d9
PH
652 if (fputc('\n', fout) == EOF) return END_WERROR;
653 message_size++;
654 body_linecount++;
655 }
656
657 return END_EOF;
658 }
659
660/* Handle the case when a dot on a line on its own, or EOF, terminates. */
661
662ch_state = 1;
663
80a47a2c 664while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
665 {
666 if (ch == 0) body_zerocount++;
667 switch (ch_state)
668 {
669 case 0: /* Normal state (previous char written) */
670 if (ch == '\n')
d677b2f2
PH
671 {
672 body_linecount++;
673 if (linelength > max_received_linelength)
674 max_received_linelength = linelength;
675 linelength = -1;
676 ch_state = 1;
677 }
059ec3d9
PH
678 else if (ch == '\r')
679 { ch_state = 2; continue; }
680 break;
681
682 case 1: /* After written "\n" */
683 if (ch == '.') { ch_state = 3; continue; }
6eb02f88 684 if (ch == '\r') { ch_state = 2; continue; }
3581f321
JH
685 if (ch == '\n') { body_linecount++; linelength = -1; }
686 else ch_state = 0;
059ec3d9
PH
687 break;
688
689 case 2:
690 body_linecount++; /* After unwritten "\r" */
d677b2f2
PH
691 if (linelength > max_received_linelength)
692 max_received_linelength = linelength;
059ec3d9 693 if (ch == '\n')
d677b2f2
PH
694 {
695 ch_state = 1;
696 linelength = -1;
697 }
059ec3d9
PH
698 else
699 {
700 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
701 if (ch == '\r') continue;
702 ch_state = 0;
d677b2f2 703 linelength = 0;
059ec3d9
PH
704 }
705 break;
706
707 case 3: /* After "\n." (\n written, dot not) */
708 if (ch == '\n') return END_DOT;
709 if (ch == '\r') { ch_state = 4; continue; }
710 message_size++;
d677b2f2 711 linelength++;
059ec3d9
PH
712 if (fputc('.', fout) == EOF) return END_WERROR;
713 ch_state = 0;
714 break;
715
716 case 4: /* After "\n.\r" (\n written, rest not) */
717 if (ch == '\n') return END_DOT;
718 message_size += 2;
719 body_linecount++;
720 if (fputs(".\n", fout) == EOF) return END_WERROR;
721 if (ch == '\r') { ch_state = 2; continue; }
722 ch_state = 0;
723 break;
724 }
725
d677b2f2 726 linelength++;
059ec3d9
PH
727 if (fputc(ch, fout) == EOF) return END_WERROR;
728 if (++message_size > thismessage_size_limit) return END_SIZE;
729 }
730
731/* Get here if EOF read. Unless we have just written "\n", we need to ensure
732the message ends with a newline, and we must also write any characters that
733were saved up while testing for an ending dot. */
734
735if (ch_state != 1)
736 {
737 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
738 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
739 message_size += Ustrlen(ends[ch_state]);
740 body_linecount++;
741 }
742
743return END_EOF;
744}
745
746
747
748
749/*************************************************
750* Read data portion of an SMTP message *
751*************************************************/
752
753/* This function is called to read the remainder of an SMTP message (after the
754headers), or to skip over it when an error has occurred. In this case, the
755output file is passed as NULL.
756
757If any line begins with a dot, that character is skipped. The input should only
758be successfully terminated by CR LF . CR LF unless it is local (non-network)
759SMTP, in which case the CRs are optional, but...
760
761FUDGE: It seems that sites on the net send out messages with just LF
762terminators, despite the warnings in the RFCs, and other MTAs handle this. So
763we make the CRs optional in all cases.
764
765July 2003: Bare CRs cause trouble. We now treat them as line terminators as
766well, so that there are no CRs in spooled messages. However, the message
767terminating dot is not recognized between two bare CRs.
768
769Arguments:
770 fout a FILE to which to write the message; NULL if skipping
771
772Returns: One of the END_xxx values indicating why it stopped reading
773*/
774
775static int
776read_message_data_smtp(FILE *fout)
777{
778int ch_state = 0;
e4bdf652 779int ch;
7e3ce68e 780int linelength = 0;
059ec3d9 781
80a47a2c 782while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
783 {
784 if (ch == 0) body_zerocount++;
785 switch (ch_state)
786 {
787 case 0: /* After LF or CRLF */
788 if (ch == '.')
789 {
790 ch_state = 3;
791 continue; /* Don't ever write . after LF */
792 }
793 ch_state = 1;
794
795 /* Else fall through to handle as normal uschar. */
796
797 case 1: /* Normal state */
798 if (ch == '\n')
799 {
800 ch_state = 0;
801 body_linecount++;
1f5497b2
PH
802 if (linelength > max_received_linelength)
803 max_received_linelength = linelength;
804 linelength = -1;
059ec3d9
PH
805 }
806 else if (ch == '\r')
807 {
808 ch_state = 2;
809 continue;
810 }
811 break;
812
813 case 2: /* After (unwritten) CR */
814 body_linecount++;
1f5497b2
PH
815 if (linelength > max_received_linelength)
816 max_received_linelength = linelength;
817 linelength = -1;
059ec3d9
PH
818 if (ch == '\n')
819 {
820 ch_state = 0;
821 }
822 else
823 {
824 message_size++;
825 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 826 (void) cutthrough_put_nl();
059ec3d9
PH
827 if (ch != '\r') ch_state = 1; else continue;
828 }
829 break;
830
831 case 3: /* After [CR] LF . */
832 if (ch == '\n')
833 return END_DOT;
834 if (ch == '\r')
835 {
836 ch_state = 4;
837 continue;
838 }
1bc460a6
JH
839 /* The dot was removed at state 3. For a doubled dot, here, reinstate
840 it to cutthrough. The current ch, dot or not, is passed both to cutthrough
841 and to file below. */
842 if (ch == '.')
843 {
844 uschar c= ch;
845 (void) cutthrough_puts(&c, 1);
846 }
847 ch_state = 1;
059ec3d9
PH
848 break;
849
850 case 4: /* After [CR] LF . CR */
851 if (ch == '\n') return END_DOT;
852 message_size++;
853 body_linecount++;
854 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 855 (void) cutthrough_put_nl();
059ec3d9
PH
856 if (ch == '\r')
857 {
858 ch_state = 2;
859 continue;
860 }
861 ch_state = 1;
862 break;
863 }
864
865 /* Add the character to the spool file, unless skipping; then loop for the
866 next. */
867
868 message_size++;
1f5497b2 869 linelength++;
7e3ce68e 870 if (fout)
059ec3d9
PH
871 {
872 if (fputc(ch, fout) == EOF) return END_WERROR;
873 if (message_size > thismessage_size_limit) return END_SIZE;
874 }
e4bdf652
JH
875 if(ch == '\n')
876 (void) cutthrough_put_nl();
877 else
878 {
7e3ce68e 879 uschar c = ch;
e4bdf652
JH
880 (void) cutthrough_puts(&c, 1);
881 }
059ec3d9
PH
882 }
883
884/* Fall through here if EOF encountered. This indicates some kind of error,
885since a correct message is terminated by [CR] LF . [CR] LF. */
886
887return END_EOF;
888}
889
890
891
892
7e3ce68e
JH
893/* Variant of the above read_message_data_smtp() specialised for RFC 3030
894CHUNKING. We assume that the incoming has proper CRLF, so only have to scan
895for and strip CR. On the downside there are more protocol reasons to stop.
896
897Arguments:
898 fout a FILE to which to write the message; NULL if skipping
899
900Returns: One of the END_xxx values indicating why it stopped reading
901*/
902
903static int
904read_message_bdat_smtp(FILE *fout)
905{
906int ch;
907int linelength = 0;
908
909for (;;) switch (ch = bdat_getc())
910 {
911 case EOF: return END_EOF;
912 case EOD: return END_DOT;
913 case ERR: return END_PROTOCOL;
914
915 case '\r':
916 body_linecount++;
917 if (linelength > max_received_linelength)
918 max_received_linelength = linelength;
919 linelength = -1;
920 break;
921
922 case 0:
923 body_zerocount++;
924 /*FALLTHROUGH*/
925 default:
926 message_size++;
927 linelength++;
928 if (fout)
929 {
930 if (fputc(ch, fout) == EOF) return END_WERROR;
931 if (message_size > thismessage_size_limit) return END_SIZE;
932 }
933#ifdef notyet
934 if(ch == '\n')
935 (void) cutthrough_put_nl();
936 else
937 {
938 uschar c = ch;
939 (void) cutthrough_puts(&c, 1);
940 }
941#endif
942 break;
943 }
944/*NOTREACHED*/
945}
946
947
948
949
059ec3d9
PH
950/*************************************************
951* Swallow SMTP message *
952*************************************************/
953
954/* This function is called when there has been some kind of error while reading
955an SMTP message, and the remaining data may need to be swallowed. It is global
956because it is called from smtp_closedown() to shut down an incoming call
957tidily.
958
959Argument: a FILE from which to read the message
960Returns: nothing
961*/
962
963void
964receive_swallow_smtp(void)
965{
7e3ce68e 966/*XXX CHUNKING: not enough. read chunks until RSET? */
059ec3d9
PH
967if (message_ended >= END_NOTENDED)
968 message_ended = read_message_data_smtp(NULL);
969}
970
971
972
973/*************************************************
974* Handle lost SMTP connection *
975*************************************************/
976
977/* This function logs connection loss incidents and generates an appropriate
978SMTP response.
979
980Argument: additional data for the message
981Returns: the SMTP response
982*/
983
984static uschar *
985handle_lost_connection(uschar *s)
986{
987log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
988 "%s lost while reading message data%s", smtp_get_connection_info(), s);
989return US"421 Lost incoming connection";
990}
991
992
993
994
995/*************************************************
996* Handle a non-smtp reception error *
997*************************************************/
998
999/* This function is called for various errors during the reception of non-SMTP
1000messages. It either sends a message to the sender of the problem message, or it
1001writes to the standard error stream.
1002
1003Arguments:
1004 errcode code for moan_to_sender(), identifying the error
1005 text1 first message text, passed to moan_to_sender()
1006 text2 second message text, used only for stderrr
1007 error_rc code to pass to exim_exit if no problem
1008 f FILE containing body of message (may be stdin)
1009 hptr pointer to instore headers or NULL
1010
1011Returns: calls exim_exit(), which does not return
1012*/
1013
1014static void
1015give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
1016 FILE *f, header_line *hptr)
1017{
1018if (error_handling == ERRORS_SENDER)
1019 {
1020 error_block eblock;
1021 eblock.next = NULL;
1022 eblock.text1 = text1;
37f3dc43 1023 eblock.text2 = US"";
059ec3d9
PH
1024 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
1025 error_rc = EXIT_FAILURE;
1026 }
37f3dc43
JH
1027else
1028 fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 1029(void)fclose(f);
059ec3d9
PH
1030exim_exit(error_rc);
1031}
1032
1033
1034
1035/*************************************************
1036* Add header lines set up by ACL *
1037*************************************************/
1038
850635b6
PH
1039/* This function is called to add the header lines that were set up by
1040statements in an ACL to the list of headers in memory. It is done in two stages
1041like this, because when the ACL for RCPT is running, the other headers have not
1042yet been received. This function is called twice; once just before running the
1043DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
1044are visible to the DATA ACL.
059ec3d9
PH
1045
1046Originally these header lines were added at the end. Now there is support for
1047three different places: top, bottom, and after the Received: header(s). There
1048will always be at least one Received: header, even if it is marked deleted, and
1049even if something else has been put in front of it.
1050
1051Arguments:
1052 acl_name text to identify which ACL
1053
1054Returns: nothing
1055*/
1056
1057static void
578d43dc 1058add_acl_headers(int where, uschar *acl_name)
059ec3d9
PH
1059{
1060header_line *h, *next;
1061header_line *last_received = NULL;
e7568d51 1062
578d43dc
JH
1063switch(where)
1064 {
1065 case ACL_WHERE_DKIM:
1066 case ACL_WHERE_MIME:
af4a1bca 1067 case ACL_WHERE_DATA:
5032d1cf 1068 if (cutthrough.fd >= 0 && (acl_removed_headers || acl_added_headers))
578d43dc
JH
1069 {
1070 log_write(0, LOG_MAIN|LOG_PANIC, "Header modification in data ACLs"
af4a1bca 1071 " will not take effect on cutthrough deliveries");
578d43dc
JH
1072 return;
1073 }
1074 }
1075
e7568d51
TL
1076if (acl_removed_headers != NULL)
1077 {
1078 DEBUG(D_receive|D_acl) debug_printf(">>Headers removed by %s ACL:\n", acl_name);
1079
4a142059 1080 for (h = header_list; h != NULL; h = h->next) if (h->type != htype_old)
e7568d51 1081 {
55414b25 1082 const uschar * list = acl_removed_headers;
e7568d51
TL
1083 int sep = ':'; /* This is specified as a colon-separated list */
1084 uschar *s;
1085 uschar buffer[128];
4a142059
JH
1086
1087 while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer))))
1088 if (header_testname(h, s, Ustrlen(s), FALSE))
e7568d51
TL
1089 {
1090 h->type = htype_old;
1091 DEBUG(D_receive|D_acl) debug_printf(" %s", h->text);
1092 }
e7568d51
TL
1093 }
1094 acl_removed_headers = NULL;
1095 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1096 }
059ec3d9 1097
71fafd95 1098if (acl_added_headers == NULL) return;
059ec3d9
PH
1099DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
1100
71fafd95 1101for (h = acl_added_headers; h != NULL; h = next)
059ec3d9
PH
1102 {
1103 next = h->next;
1104
1105 switch(h->type)
1106 {
1107 case htype_add_top:
1108 h->next = header_list;
1109 header_list = h;
1110 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
1111 break;
1112
1113 case htype_add_rec:
1114 if (last_received == NULL)
1115 {
1116 last_received = header_list;
1117 while (!header_testname(last_received, US"Received", 8, FALSE))
1118 last_received = last_received->next;
1119 while (last_received->next != NULL &&
1120 header_testname(last_received->next, US"Received", 8, FALSE))
1121 last_received = last_received->next;
1122 }
1123 h->next = last_received->next;
1124 last_received->next = h;
1125 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
1126 break;
1127
8523533c
TK
1128 case htype_add_rfc:
1129 /* add header before any header which is NOT Received: or Resent- */
1130 last_received = header_list;
1131 while ( (last_received->next != NULL) &&
1132 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
1133 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
1134 last_received = last_received->next;
1135 /* last_received now points to the last Received: or Resent-* header
1136 in an uninterrupted chain of those header types (seen from the beginning
1137 of all headers. Our current header must follow it. */
1138 h->next = last_received->next;
1139 last_received->next = h;
8e669ac1 1140 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
1141 break;
1142
059ec3d9
PH
1143 default:
1144 h->next = NULL;
1145 header_last->next = h;
1146 break;
1147 }
1148
1149 if (h->next == NULL) header_last = h;
1150
1151 /* Check for one of the known header types (From:, To:, etc.) though in
1152 practice most added headers are going to be "other". Lower case
1153 identification letters are never stored with the header; they are used
1154 for existence tests when messages are received. So discard any lower case
1155 flag values. */
1156
1157 h->type = header_checkname(h, FALSE);
1158 if (h->type >= 'a') h->type = htype_other;
1159
1160 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1161 }
1162
71fafd95 1163acl_added_headers = NULL;
059ec3d9
PH
1164DEBUG(D_receive|D_acl) debug_printf(">>\n");
1165}
1166
1167
1168
1169/*************************************************
1170* Add host information for log line *
1171*************************************************/
1172
1173/* Called for acceptance and rejecting log lines. This adds information about
1174the calling host to a string that is being built dynamically.
1175
1176Arguments:
1177 s the dynamic string
1178 sizeptr points to the size variable
1179 ptrptr points to the pointer variable
1180
1181Returns: the extended string
1182*/
1183
1184static uschar *
fc16abb4 1185add_host_info_for_log(uschar * s, int * sizeptr, int * ptrptr)
059ec3d9 1186{
fc16abb4 1187if (sender_fullhost)
059ec3d9 1188 {
fc16abb4
JH
1189 if (LOGGING(dnssec) && sender_host_dnssec) /*XXX sender_helo_dnssec? */
1190 s = string_cat(s, sizeptr, ptrptr, US" DS");
059ec3d9 1191 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
6c6d6e48 1192 if (LOGGING(incoming_interface) && interface_address != NULL)
059ec3d9 1193 {
fc16abb4
JH
1194 s = string_cat(s, sizeptr, ptrptr,
1195 string_sprintf(" I=[%s]:%d", interface_address, interface_port));
059ec3d9
PH
1196 }
1197 }
1198if (sender_ident != NULL)
1199 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1200if (received_protocol != NULL)
1201 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1202return s;
1203}
1204
1205
1206
63955bf2 1207#ifdef WITH_CONTENT_SCAN
059ec3d9 1208
54cdb463
PH
1209/*************************************************
1210* Run the MIME ACL on a message *
1211*************************************************/
1212
1213/* This code is in a subroutine so that it can be used for both SMTP
1214and non-SMTP messages. It is called with a non-NULL ACL pointer.
1215
1216Arguments:
1217 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1218 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1219 smtp_reply_ptr Where SMTP reply is being built
1220 blackholed_by_ptr Where "blackholed by" message is being built
1221
1222Returns: TRUE to carry on; FALSE to abandon the message
1223*/
1224
1225static BOOL
1226run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1227 uschar **blackholed_by_ptr)
1228{
1229FILE *mbox_file;
1230uschar rfc822_file_path[2048];
1231unsigned long mbox_size;
1232header_line *my_headerlist;
1233uschar *user_msg, *log_msg;
1234int mime_part_count_buffer = -1;
7156b1ef 1235int rc = OK;
54cdb463
PH
1236
1237memset(CS rfc822_file_path,0,2048);
1238
1239/* check if it is a MIME message */
1240my_headerlist = header_list;
4e88a19f
PH
1241while (my_headerlist != NULL)
1242 {
54cdb463 1243 /* skip deleted headers */
4e88a19f
PH
1244 if (my_headerlist->type == '*')
1245 {
54cdb463
PH
1246 my_headerlist = my_headerlist->next;
1247 continue;
4e88a19f
PH
1248 }
1249 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1250 {
54cdb463
PH
1251 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1252 goto DO_MIME_ACL;
4e88a19f 1253 }
54cdb463 1254 my_headerlist = my_headerlist->next;
4e88a19f 1255 }
54cdb463
PH
1256
1257DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1258return TRUE;
1259
1260DO_MIME_ACL:
1261/* make sure the eml mbox file is spooled up */
8544e77a 1262mbox_file = spool_mbox(&mbox_size, NULL);
54cdb463
PH
1263if (mbox_file == NULL) {
1264 /* error while spooling */
1265 log_write(0, LOG_MAIN|LOG_PANIC,
1266 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1267 Uunlink(spool_name);
1268 unspool_mbox();
6f0c431a
PP
1269#ifdef EXPERIMENTAL_DCC
1270 dcc_ok = 0;
1271#endif
a5bd321b 1272 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
54cdb463
PH
1273 message_id[0] = 0; /* Indicate no message accepted */
1274 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1275 return FALSE; /* Indicate skip to end of receive function */
1276};
1277
1278mime_is_rfc822 = 0;
1279
1280MIME_ACL_CHECK:
1281mime_part_count = -1;
1282rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1283(void)fclose(mbox_file);
54cdb463 1284
4e88a19f
PH
1285if (Ustrlen(rfc822_file_path) > 0)
1286 {
54cdb463
PH
1287 mime_part_count = mime_part_count_buffer;
1288
4e88a19f
PH
1289 if (unlink(CS rfc822_file_path) == -1)
1290 {
54cdb463
PH
1291 log_write(0, LOG_PANIC,
1292 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1293 goto END_MIME_ACL;
4e88a19f
PH
1294 }
1295 }
54cdb463
PH
1296
1297/* check if we must check any message/rfc822 attachments */
4e88a19f
PH
1298if (rc == OK)
1299 {
54cdb463 1300 uschar temp_path[1024];
e8bc7fca
JH
1301 struct dirent * entry;
1302 DIR * tempdir;
54cdb463 1303
e8bc7fca
JH
1304 (void) string_format(temp_path, sizeof(temp_path), "%s/scan/%s",
1305 spool_directory, message_id);
54cdb463 1306
4e88a19f 1307 tempdir = opendir(CS temp_path);
e8bc7fca 1308 for (;;)
4e88a19f 1309 {
e8bc7fca
JH
1310 if (!(entry = readdir(tempdir)))
1311 break;
1312 if (strncmpic(US entry->d_name, US"__rfc822_", 9) == 0)
4e88a19f 1313 {
e8bc7fca
JH
1314 (void) string_format(rfc822_file_path, sizeof(rfc822_file_path),
1315 "%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
1316 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n",
1317 rfc822_file_path);
4e88a19f
PH
1318 break;
1319 }
e8bc7fca 1320 }
4e88a19f 1321 closedir(tempdir);
54cdb463 1322
e8bc7fca 1323 if (entry)
4e88a19f 1324 {
e8bc7fca 1325 if ((mbox_file = Ufopen(rfc822_file_path, "rb")))
4e88a19f 1326 {
e8bc7fca
JH
1327 /* set RFC822 expansion variable */
1328 mime_is_rfc822 = 1;
1329 mime_part_count_buffer = mime_part_count;
1330 goto MIME_ACL_CHECK;
4e88a19f 1331 }
e8bc7fca
JH
1332 log_write(0, LOG_PANIC,
1333 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1334 unlink(CS rfc822_file_path);
4e88a19f
PH
1335 }
1336 }
54cdb463
PH
1337
1338END_MIME_ACL:
578d43dc 1339add_acl_headers(ACL_WHERE_MIME, US"MIME");
54cdb463
PH
1340if (rc == DISCARD)
1341 {
1342 recipients_count = 0;
1343 *blackholed_by_ptr = US"MIME ACL";
1344 }
1345else if (rc != OK)
1346 {
1347 Uunlink(spool_name);
1348 unspool_mbox();
6f0c431a
PP
1349#ifdef EXPERIMENTAL_DCC
1350 dcc_ok = 0;
1351#endif
4f6ae5c3
JH
1352 if ( smtp_input
1353 && smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1354 {
85ffcba6 1355 *smtp_yield_ptr = FALSE; /* No more messages after dropped connection */
f4c1088b 1356 *smtp_reply_ptr = US""; /* Indicate reply already sent */
4f6ae5c3 1357 }
54cdb463
PH
1358 message_id[0] = 0; /* Indicate no message accepted */
1359 return FALSE; /* Cause skip to end of receive function */
4e88a19f 1360 }
54cdb463
PH
1361
1362return TRUE;
1363}
1364
63955bf2 1365#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1366
1367
e4bdf652
JH
1368
1369void
1370received_header_gen(void)
1371{
1372uschar *received;
1373uschar *timestamp;
1374header_line *received_header= header_list;
1375
1376timestamp = expand_string(US"${tod_full}");
1377if (recipients_count == 1) received_for = recipients_list[0].address;
1378received = expand_string(received_header_text);
1379received_for = NULL;
1380
d4ff61d1 1381if (!received)
e4bdf652
JH
1382 {
1383 if(spool_name[0] != 0)
1384 Uunlink(spool_name); /* Lose the data file */
1385 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1386 "(received_header_text) failed: %s", string_printing(received_header_text),
1387 expand_string_message);
1388 }
1389
1390/* The first element on the header chain is reserved for the Received header,
1391so all we have to do is fill in the text pointer, and set the type. However, if
1392the result of the expansion is an empty string, we leave the header marked as
1393"old" so as to refrain from adding a Received header. */
1394
1395if (received[0] == 0)
1396 {
1397 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1398 received_header->type = htype_old;
1399 }
1400else
1401 {
1402 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1403 received_header->type = htype_received;
1404 }
1405
1406received_header->slen = Ustrlen(received_header->text);
1407
1408DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1409 received_header->type, received_header->text);
1410}
1411
1412
1413
059ec3d9
PH
1414/*************************************************
1415* Receive message *
1416*************************************************/
1417
1418/* Receive a message on the given input, and put it into a pair of spool files.
1419Either a non-null list of recipients, or the extract flag will be true, or
1420both. The flag sender_local is true for locally generated messages. The flag
1421submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a 1422suppress_local_fixups is true if an ACL has obeyed "control =
f4ee74ac
PP
1423suppress_local_fixups" or -G was passed on the command-line.
1424The flag smtp_input is true if the message is to be
8800895a
PH
1425handled using SMTP conventions about termination and lines starting with dots.
1426For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1427
1428If a message was successfully read, message_id[0] will be non-zero.
1429
1430The general actions of this function are:
1431
1432 . Read the headers of the message (if any) into a chain of store
1433 blocks.
1434
1435 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1436 throw it away, unless the caller is trusted, or unless
1437 active_local_sender_retain is set - which can only happen if
1438 active_local_from_check is false.
059ec3d9
PH
1439
1440 . If recipients are to be extracted from the message, build the
1441 recipients list from the headers, removing any that were on the
1442 original recipients list (unless extract_addresses_remove_arguments is
1443 false), and at the same time, remove any bcc header that may be present.
1444
1445 . Get the spool file for the data, sort out its unique name, open
1446 and lock it (but don't give it the name yet).
1447
1448 . Generate a "Message-Id" header if the message doesn't have one, for
1449 locally-originated messages.
1450
1451 . Generate a "Received" header.
1452
1453 . Ensure the recipients list is fully qualified and rewritten if necessary.
1454
1455 . If there are any rewriting rules, apply them to the sender address
1456 and also to the headers.
1457
1458 . If there is no from: header, generate one, for locally-generated messages
1459 and messages in "submission mode" only.
1460
1461 . If the sender is local, check that from: is correct, and if not, generate
1462 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1463 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1464
1465 . If there is no "date" header, generate one, for locally-originated
1466 or submission mode messages only.
1467
1468 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1469 dot_ends mode, to the data file. Leave it open, to hold the lock.
1470
1471 . Write the envelope and the headers to a new file.
1472
1473 . Set the name for the header file; close it.
1474
1475 . Set the name for the data file; close it.
1476
1477Because this function can potentially be called many times in a single
1478SMTP connection, all store should be got by store_get(), so that it will be
1479automatically retrieved after the message is accepted.
1480
1481FUDGE: It seems that sites on the net send out messages with just LF
1482terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1483we make the CRs optional in all cases.
1484
1485July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1486new regime is now in place in which bare CRs in header lines are turned into LF
1487followed by a space, so as not to terminate the header line.
1488
1489February 2004: A bare LF in a header line in a message whose first line was
1490terminated by CRLF is treated in the same way as a bare CR.
1491
1492Arguments:
1493 extract_recip TRUE if recipients are to be extracted from the message's
1494 headers
1495
1496Returns: TRUE there are more messages to be read (SMTP input)
1497 FALSE there are no more messages to be read (non-SMTP input
1498 or SMTP connection collapsed, or other failure)
1499
1500When reading a message for filter testing, the returned value indicates
1501whether the headers (which is all that is read) were terminated by '.' or
1502not. */
1503
1504BOOL
1505receive_msg(BOOL extract_recip)
1506{
7156b1ef
NM
1507int i;
1508int rc = FAIL;
059ec3d9
PH
1509int msg_size = 0;
1510int process_info_len = Ustrlen(process_info);
1511int error_rc = (error_handling == ERRORS_SENDER)?
1512 errors_sender_rc : EXIT_FAILURE;
1513int header_size = 256;
1514int start, end, domain, size, sptr;
1515int id_resolution;
1516int had_zero = 0;
d677b2f2 1517int prevlines_length = 0;
059ec3d9
PH
1518
1519register int ptr = 0;
1520
1521BOOL contains_resent_headers = FALSE;
1522BOOL extracted_ignored = FALSE;
1523BOOL first_line_ended_crlf = TRUE_UNSET;
1524BOOL smtp_yield = TRUE;
1525BOOL yield = FALSE;
1526
1527BOOL resents_exist = FALSE;
1528uschar *resent_prefix = US"";
1529uschar *blackholed_by = NULL;
04f7d5b9 1530uschar *blackhole_log_msg = US"";
c5430c20 1531enum {NOT_TRIED, TMP_REJ, PERM_REJ, ACCEPTED} cutthrough_done = NOT_TRIED;
059ec3d9
PH
1532
1533flock_t lock_data;
1534error_block *bad_addresses = NULL;
1535
1536uschar *frozen_by = NULL;
1537uschar *queued_by = NULL;
1538
1539uschar *errmsg, *s;
1540struct stat statbuf;
1541
4e88a19f 1542/* Final message to give to SMTP caller, and messages from ACLs */
059ec3d9
PH
1543
1544uschar *smtp_reply = NULL;
4e88a19f 1545uschar *user_msg, *log_msg;
059ec3d9
PH
1546
1547/* Working header pointers */
1548
1549header_line *h, *next;
1550
2cbb4081 1551/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1552
1553BOOL date_header_exists = FALSE;
1554
1555/* Pointers to receive the addresses of headers whose contents we need. */
1556
1557header_line *from_header = NULL;
1558header_line *subject_header = NULL;
1559header_line *msgid_header = NULL;
1560header_line *received_header;
1561
4840604e
TL
1562#ifdef EXPERIMENTAL_DMARC
1563int dmarc_up = 0;
1564#endif /* EXPERIMENTAL_DMARC */
1565
059ec3d9
PH
1566/* Variables for use when building the Received: header. */
1567
059ec3d9
PH
1568uschar *timestamp;
1569int tslen;
1570
1571/* Release any open files that might have been cached while preparing to
1572accept the message - e.g. by verifying addresses - because reading a message
1573might take a fair bit of real time. */
1574
1575search_tidyup();
1576
e4bdf652
JH
1577/* Extracting the recipient list from an input file is incompatible with
1578cutthrough delivery with the no-spool option. It shouldn't be possible
817d9f57 1579to set up the combination, but just in case kill any ongoing connection. */
e4bdf652 1580if (extract_recip || !smtp_input)
2e5b33cd 1581 cancel_cutthrough_connection("not smtp input");
e4bdf652 1582
059ec3d9
PH
1583/* Initialize the chain of headers by setting up a place-holder for Received:
1584header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1585pointing to the end of the chain to make adding headers simple. */
1586
1587received_header = header_list = header_last = store_get(sizeof(header_line));
1588header_list->next = NULL;
1589header_list->type = htype_old;
1590header_list->text = NULL;
1591header_list->slen = 0;
1592
1593/* Control block for the next header to be read. */
1594
1595next = store_get(sizeof(header_line));
1596next->text = store_get(header_size);
1597
1598/* Initialize message id to be null (indicating no message read), and the
1599header names list to be the normal list. Indicate there is no data file open
1600yet, initialize the size and warning count, and deal with no size limit. */
1601
1602message_id[0] = 0;
1603data_file = NULL;
1604data_fd = -1;
41313d92 1605spool_name = US"";
059ec3d9
PH
1606message_size = 0;
1607warning_count = 0;
d677b2f2 1608received_count = 1; /* For the one we will add */
059ec3d9
PH
1609
1610if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1611
2e0c1448 1612/* While reading the message, the following counts are computed. */
059ec3d9 1613
d677b2f2
PH
1614message_linecount = body_linecount = body_zerocount =
1615 max_received_linelength = 0;
059ec3d9 1616
80a47a2c 1617#ifndef DISABLE_DKIM
e983e85a
JH
1618/* Call into DKIM to set up the context. In CHUNKING mode
1619we clear the dot-stuffing flag */
1620if (smtp_input && !smtp_batched_input && !dkim_disable_verify)
1621 dkim_exim_verify_init(chunking_state <= CHUNKING_OFFERED);
fb2274d4
TK
1622#endif
1623
4840604e
TL
1624#ifdef EXPERIMENTAL_DMARC
1625/* initialize libopendmarc */
1626dmarc_up = dmarc_init();
1627#endif
1628
059ec3d9
PH
1629/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1630ids, and fractions of a second are required. See the comments that precede the
1631message id creation below. */
1632
1633(void)gettimeofday(&message_id_tv, NULL);
1634
1635/* For other uses of the received time we can operate with granularity of one
1636second, and for that we use the global variable received_time. This is for
1637things like ultimate message timeouts. */
1638
1639received_time = message_id_tv.tv_sec;
1640
1641/* If SMTP input, set the special handler for timeouts. The alarm() calls
1642happen in the smtp_getc() function when it refills its buffer. */
1643
1644if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1645
1646/* If not SMTP input, timeout happens only if configured, and we just set a
1647single timeout for the whole message. */
1648
1649else if (receive_timeout > 0)
1650 {
1651 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1652 alarm(receive_timeout);
1653 }
1654
1655/* SIGTERM and SIGINT are caught always. */
1656
1657signal(SIGTERM, data_sigterm_sigint_handler);
1658signal(SIGINT, data_sigterm_sigint_handler);
1659
1660/* Header lines in messages are not supposed to be very long, though when
1661unfolded, to: and cc: headers can take up a lot of store. We must also cope
1662with the possibility of junk being thrown at us. Start by getting 256 bytes for
1663storing the header, and extend this as necessary using string_cat().
1664
1665To cope with total lunacies, impose an upper limit on the length of the header
1666section of the message, as otherwise the store will fill up. We must also cope
1667with the possibility of binary zeros in the data. Hence we cannot use fgets().
1668Folded header lines are joined into one string, leaving the '\n' characters
1669inside them, so that writing them out reproduces the input.
1670
1671Loop for each character of each header; the next structure for chaining the
1672header is set up already, with ptr the offset of the next character in
1673next->text. */
1674
1675for (;;)
1676 {
80a47a2c 1677 int ch = (receive_getc)();
059ec3d9
PH
1678
1679 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1680 SMTP must have a correct "." terminator. */
1681
1682 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1683 {
1684 smtp_reply = handle_lost_connection(US" (header)");
1685 smtp_yield = FALSE;
1686 goto TIDYUP; /* Skip to end of function */
1687 }
1688
1689 /* See if we are at the current header's size limit - there must be at least
1690 four bytes left. This allows for the new character plus a zero, plus two for
1691 extra insertions when we are playing games with dots and carriage returns. If
1692 we are at the limit, extend the text buffer. This could have been done
1693 automatically using string_cat() but because this is a tightish loop storing
1694 only one character at a time, we choose to do it inline. Normally
1695 store_extend() will be able to extend the block; only at the end of a big
1696 store block will a copy be needed. To handle the case of very long headers
1697 (and sometimes lunatic messages can have ones that are 100s of K long) we
1698 call store_release() for strings that have been copied - if the string is at
1699 the start of a block (and therefore the only thing in it, because we aren't
1700 doing any other gets), the block gets freed. We can only do this because we
1701 know there are no other calls to store_get() going on. */
1702
1703 if (ptr >= header_size - 4)
1704 {
1705 int oldsize = header_size;
1706 /* header_size += 256; */
1707 header_size *= 2;
1708 if (!store_extend(next->text, oldsize, header_size))
1709 {
1710 uschar *newtext = store_get(header_size);
1711 memcpy(newtext, next->text, ptr);
1712 store_release(next->text);
1713 next->text = newtext;
1714 }
1715 }
1716
1717 /* Cope with receiving a binary zero. There is dispute about whether
1718 these should be allowed in RFC 822 messages. The middle view is that they
1719 should not be allowed in headers, at least. Exim takes this attitude at
1720 the moment. We can't just stomp on them here, because we don't know that
1721 this line is a header yet. Set a flag to cause scanning later. */
1722
1723 if (ch == 0) had_zero++;
1724
1725 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1726 those from data files use just LF. Treat LF in local SMTP input as a
1727 terminator too. Treat EOF as a line terminator always. */
1728
1729 if (ch == EOF) goto EOL;
1730
1731 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1732 other MTAs accept this. We are therefore forced into this "liberalisation"
1733 too, so we accept LF as a line terminator whatever the source of the message.
1734 However, if the first line of the message ended with a CRLF, we treat a bare
1735 LF specially by inserting a white space after it to ensure that the header
1736 line is not terminated. */
1737
1738 if (ch == '\n')
1739 {
1740 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
80a47a2c 1741 else if (first_line_ended_crlf) receive_ungetc(' ');
059ec3d9
PH
1742 goto EOL;
1743 }
1744
1745 /* This is not the end of the line. If this is SMTP input and this is
1746 the first character in the line and it is a "." character, ignore it.
1747 This implements the dot-doubling rule, though header lines starting with
1748 dots aren't exactly common. They are legal in RFC 822, though. If the
1749 following is CRLF or LF, this is the line that that terminates the
1750 entire message. We set message_ended to indicate this has happened (to
1751 prevent further reading), and break out of the loop, having freed the
1752 empty header, and set next = NULL to indicate no data line. */
1753
1754 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1755 {
80a47a2c 1756 ch = (receive_getc)();
059ec3d9
PH
1757 if (ch == '\r')
1758 {
80a47a2c 1759 ch = (receive_getc)();
059ec3d9
PH
1760 if (ch != '\n')
1761 {
80a47a2c 1762 receive_ungetc(ch);
059ec3d9
PH
1763 ch = '\r'; /* Revert to CR */
1764 }
1765 }
1766 if (ch == '\n')
1767 {
1768 message_ended = END_DOT;
1769 store_reset(next);
1770 next = NULL;
1771 break; /* End character-reading loop */
1772 }
1773
1774 /* For non-SMTP input, the dot at the start of the line was really a data
1775 character. What is now in ch is the following character. We guaranteed
1776 enough space for this above. */
1777
1778 if (!smtp_input)
1779 {
1780 next->text[ptr++] = '.';
1781 message_size++;
1782 }
1783 }
1784
1785 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1786 remember this case if this is the first line ending. */
1787
1788 if (ch == '\r')
1789 {
80a47a2c 1790 ch = (receive_getc)();
059ec3d9
PH
1791 if (ch == '\n')
1792 {
1793 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1794 goto EOL;
1795 }
1796
1797 /* Otherwise, put back the character after CR, and turn the bare CR
1798 into LF SP. */
1799
80a47a2c 1800 ch = (receive_ungetc)(ch);
059ec3d9
PH
1801 next->text[ptr++] = '\n';
1802 message_size++;
1803 ch = ' ';
1804 }
1805
1806 /* We have a data character for the header line. */
1807
1808 next->text[ptr++] = ch; /* Add to buffer */
1809 message_size++; /* Total message size so far */
1810
1811 /* Handle failure due to a humungously long header section. The >= allows
1812 for the terminating \n. Add what we have so far onto the headers list so
1813 that it gets reflected in any error message, and back up the just-read
1814 character. */
1815
1816 if (message_size >= header_maxsize)
1817 {
1818 next->text[ptr] = 0;
1819 next->slen = ptr;
1820 next->type = htype_other;
1821 next->next = NULL;
1822 header_last->next = next;
1823 header_last = next;
1824
1825 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1826 "%s (more than %d characters): message abandoned",
1827 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1828
1829 if (smtp_input)
1830 {
1831 smtp_reply = US"552 Message header is ridiculously long";
1832 receive_swallow_smtp();
1833 goto TIDYUP; /* Skip to end of function */
1834 }
1835
1836 else
1837 {
1838 give_local_error(ERRMESS_VLONGHEADER,
1839 string_sprintf("message header longer than %d characters received: "
1840 "message not accepted", header_maxsize), US"", error_rc, stdin,
1841 header_list->next);
1842 /* Does not return */
1843 }
1844 }
1845
1846 continue; /* With next input character */
1847
1848 /* End of header line reached */
1849
1850 EOL:
2e0c1448
PH
1851
1852 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1853
1854 receive_linecount++;
1855 message_linecount++;
059ec3d9 1856
d677b2f2
PH
1857 /* Keep track of maximum line length */
1858
1859 if (ptr - prevlines_length > max_received_linelength)
1860 max_received_linelength = ptr - prevlines_length;
1861 prevlines_length = ptr + 1;
1862
059ec3d9
PH
1863 /* Now put in the terminating newline. There is always space for
1864 at least two more characters. */
1865
1866 next->text[ptr++] = '\n';
1867 message_size++;
1868
1869 /* A blank line signals the end of the headers; release the unwanted
1870 space and set next to NULL to indicate this. */
1871
1872 if (ptr == 1)
1873 {
1874 store_reset(next);
1875 next = NULL;
1876 break;
1877 }
1878
1879 /* There is data in the line; see if the next input character is a
1880 whitespace character. If it is, we have a continuation of this header line.
1881 There is always space for at least one character at this point. */
1882
1883 if (ch != EOF)
1884 {
80a47a2c 1885 int nextch = (receive_getc)();
059ec3d9
PH
1886 if (nextch == ' ' || nextch == '\t')
1887 {
1888 next->text[ptr++] = nextch;
1889 message_size++;
1890 continue; /* Iterate the loop */
1891 }
80a47a2c 1892 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
059ec3d9
PH
1893 else ch = EOF; /* Cause main loop to exit at end */
1894 }
1895
1896 /* We have got to the real line end. Terminate the string and release store
1897 beyond it. If it turns out to be a real header, internal binary zeros will
1898 be squashed later. */
1899
1900 next->text[ptr] = 0;
1901 next->slen = ptr;
1902 store_reset(next->text + ptr + 1);
1903
1904 /* Check the running total size against the overall message size limit. We
1905 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1906 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1907 headers - the code to read the body will then also hit the buffer. */
1908
1909 if (message_size > thismessage_size_limit) break;
1910
1911 /* A line that is not syntactically correct for a header also marks
1912 the end of the headers. In this case, we leave next containing the
1913 first data line. This might actually be several lines because of the
1914 continuation logic applied above, but that doesn't matter.
1915
1916 It turns out that smail, and presumably sendmail, accept leading lines
1917 of the form
1918
1919 From ph10 Fri Jan 5 12:35 GMT 1996
1920
1921 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1922 find any documentation of this, but for compatibility it had better be
1923 accepted. Exim restricts it to the case of non-smtp messages, and
1924 treats it as an alternative to the -f command line option. Thus it is
1925 ignored except for trusted users or filter testing. Otherwise it is taken
1926 as the sender address, unless -f was used (sendmail compatibility).
1927
1928 It further turns out that some UUCPs generate the From_line in a different
1929 format, e.g.
1930
1931 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1932
1933 The regex for matching these things is now capable of recognizing both
1934 formats (including 2- and 4-digit years in the latter). In fact, the regex
1935 is now configurable, as is the expansion string to fish out the sender.
1936
1937 Even further on it has been discovered that some broken clients send
1938 these lines in SMTP messages. There is now an option to ignore them from
1939 specified hosts or networks. Sigh. */
1940
1941 if (header_last == header_list &&
1942 (!smtp_input
1943 ||
1944 (sender_host_address != NULL &&
1945 verify_check_host(&ignore_fromline_hosts) == OK)
1946 ||
1947 (sender_host_address == NULL && ignore_fromline_local)
1948 ) &&
1949 regex_match_and_setup(regex_From, next->text, 0, -1))
1950 {
1951 if (!sender_address_forced)
1952 {
1953 uschar *uucp_sender = expand_string(uucp_from_sender);
1954 if (uucp_sender == NULL)
1955 {
1956 log_write(0, LOG_MAIN|LOG_PANIC,
1957 "expansion of \"%s\" failed after matching "
1958 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1959 }
1960 else
1961 {
1962 int start, end, domain;
1963 uschar *errmess;
1964 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1965 &start, &end, &domain, TRUE);
1966 if (newsender != NULL)
1967 {
1968 if (domain == 0 && newsender[0] != 0)
1969 newsender = rewrite_address_qualify(newsender, FALSE);
1970
f05da2e8 1971 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1972 {
1973 sender_address = newsender;
1974
f05da2e8 1975 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1976 {
1977 authenticated_sender = NULL;
1978 originator_name = US"";
1979 sender_local = FALSE;
1980 }
1981
f05da2e8 1982 if (filter_test != FTEST_NONE)
059ec3d9
PH
1983 printf("Sender taken from \"From \" line\n");
1984 }
1985 }
1986 }
1987 }
1988 }
1989
1990 /* Not a leading "From " line. Check to see if it is a valid header line.
1991 Header names may contain any non-control characters except space and colon,
1992 amazingly. */
1993
1994 else
1995 {
1996 uschar *p = next->text;
1997
1998 /* If not a valid header line, break from the header reading loop, leaving
1999 next != NULL, indicating that it holds the first line of the body. */
2000
2001 if (isspace(*p)) break;
2002 while (mac_isgraph(*p) && *p != ':') p++;
2003 while (isspace(*p)) p++;
2004 if (*p != ':')
2005 {
2006 body_zerocount = had_zero;
2007 break;
2008 }
2009
2010 /* We have a valid header line. If there were any binary zeroes in
2011 the line, stomp on them here. */
2012
2013 if (had_zero > 0)
2014 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
2015
2016 /* It is perfectly legal to have an empty continuation line
2017 at the end of a header, but it is confusing to humans
2018 looking at such messages, since it looks like a blank line.
2019 Reduce confusion by removing redundant white space at the
2020 end. We know that there is at least one printing character
2021 (the ':' tested for above) so there is no danger of running
2022 off the end. */
2023
2024 p = next->text + ptr - 2;
2025 for (;;)
2026 {
2027 while (*p == ' ' || *p == '\t') p--;
2028 if (*p != '\n') break;
2029 ptr = (p--) - next->text + 1;
2030 message_size -= next->slen - ptr;
2031 next->text[ptr] = 0;
2032 next->slen = ptr;
2033 }
2034
2035 /* Add the header to the chain */
2036
2037 next->type = htype_other;
2038 next->next = NULL;
2039 header_last->next = next;
2040 header_last = next;
2041
2042 /* Check the limit for individual line lengths. This comes after adding to
2043 the chain so that the failing line is reflected if a bounce is generated
2044 (for a local message). */
2045
2046 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
2047 {
2048 log_write(0, LOG_MAIN, "overlong message header line received from "
2049 "%s (more than %d characters): message abandoned",
2050 sender_host_unknown? sender_ident : sender_fullhost,
2051 header_line_maxsize);
2052
2053 if (smtp_input)
2054 {
2055 smtp_reply = US"552 A message header line is too long";
2056 receive_swallow_smtp();
2057 goto TIDYUP; /* Skip to end of function */
2058 }
2059
2060 else
2061 {
2062 give_local_error(ERRMESS_VLONGHDRLINE,
2063 string_sprintf("message header line longer than %d characters "
2064 "received: message not accepted", header_line_maxsize), US"",
2065 error_rc, stdin, header_list->next);
2066 /* Does not return */
2067 }
2068 }
2069
2070 /* Note if any resent- fields exist. */
2071
2072 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
2073 {
2074 resents_exist = TRUE;
2075 resent_prefix = US"Resent-";
2076 }
2077 }
2078
2079 /* The line has been handled. If we have hit EOF, break out of the loop,
2080 indicating no pending data line. */
2081
2082 if (ch == EOF) { next = NULL; break; }
2083
2084 /* Set up for the next header */
2085
2086 header_size = 256;
2087 next = store_get(sizeof(header_line));
2088 next->text = store_get(header_size);
2089 ptr = 0;
2090 had_zero = 0;
d677b2f2 2091 prevlines_length = 0;
059ec3d9
PH
2092 } /* Continue, starting to read the next header */
2093
2094/* At this point, we have read all the headers into a data structure in main
2095store. The first header is still the dummy placeholder for the Received: header
2096we are going to generate a bit later on. If next != NULL, it contains the first
2097data line - which terminated the headers before reaching a blank line (not the
2098normal case). */
2099
2100DEBUG(D_receive)
2101 {
2102 debug_printf(">>Headers received:\n");
2103 for (h = header_list->next; h != NULL; h = h->next)
2104 debug_printf("%s", h->text);
2105 debug_printf("\n");
2106 }
2107
2108/* End of file on any SMTP connection is an error. If an incoming SMTP call
2109is dropped immediately after valid headers, the next thing we will see is EOF.
2110We must test for this specially, as further down the reading of the data is
2111skipped if already at EOF. */
2112
2113if (smtp_input && (receive_feof)())
2114 {
2115 smtp_reply = handle_lost_connection(US" (after header)");
2116 smtp_yield = FALSE;
2117 goto TIDYUP; /* Skip to end of function */
2118 }
2119
2120/* If this is a filter test run and no headers were read, output a warning
2121in case there is a mistake in the test message. */
2122
f05da2e8 2123if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
2124 printf("Warning: no message headers read\n");
2125
2126
2127/* Scan the headers to identify them. Some are merely marked for later
2128processing; some are dealt with here. */
2129
2130for (h = header_list->next; h != NULL; h = h->next)
2131 {
2132 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
2133 if (is_resent) contains_resent_headers = TRUE;
2134
2135 switch (header_checkname(h, is_resent))
2136 {
059ec3d9 2137 case htype_bcc:
2cbb4081 2138 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
2139 break;
2140
059ec3d9 2141 case htype_cc:
2cbb4081 2142 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
2143 break;
2144
2145 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
2146
2147 case htype_date:
4c69d561 2148 if (!resents_exist || is_resent) date_header_exists = TRUE;
059ec3d9
PH
2149 break;
2150
2151 /* Same comments as about Return-Path: below. */
2152
2153 case htype_delivery_date:
2154 if (delivery_date_remove) h->type = htype_old;
2155 break;
2156
2157 /* Same comments as about Return-Path: below. */
2158
2159 case htype_envelope_to:
2160 if (envelope_to_remove) h->type = htype_old;
2161 break;
2162
2163 /* Mark all "From:" headers so they get rewritten. Save the one that is to
2164 be used for Sender: checking. For Sendmail compatibility, if the "From:"
2165 header consists of just the login id of the user who called Exim, rewrite
2166 it with the gecos field first. Apply this rule to Resent-From: if there
2167 are resent- fields. */
2168
2169 case htype_from:
2170 h->type = htype_from;
2171 if (!resents_exist || is_resent)
2172 {
2173 from_header = h;
2174 if (!smtp_input)
2175 {
5de8faa3 2176 int len;
059ec3d9
PH
2177 uschar *s = Ustrchr(h->text, ':') + 1;
2178 while (isspace(*s)) s++;
5de8faa3 2179 len = h->slen - (s - h->text) - 1;
e0fccd1d
TF
2180 if (Ustrlen(originator_login) == len &&
2181 strncmpic(s, originator_login, len) == 0)
059ec3d9
PH
2182 {
2183 uschar *name = is_resent? US"Resent-From" : US"From";
2184 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2185 originator_login, qualify_domain_sender);
2186 from_header = header_last;
2187 h->type = htype_old;
2188 DEBUG(D_receive|D_rewrite)
2189 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2190 }
2191 }
2192 }
2193 break;
2194
2195 /* Identify the Message-id: header for generating "in-reply-to" in the
2196 autoreply transport. For incoming logging, save any resent- value. In both
2197 cases, take just the first of any multiples. */
2198
2199 case htype_id:
2200 if (msgid_header == NULL && (!resents_exist || is_resent))
2201 {
2202 msgid_header = h;
2203 h->type = htype_id;
2204 }
2205 break;
2206
2207 /* Flag all Received: headers */
2208
2209 case htype_received:
2210 h->type = htype_received;
2211 received_count++;
2212 break;
2213
2214 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2215
2216 case htype_reply_to:
2217 h->type = htype_reply_to;
2218 break;
2219
2220 /* The Return-path: header is supposed to be added to messages when
2221 they leave the SMTP system. We shouldn't receive messages that already
2222 contain Return-path. However, since Exim generates Return-path: on
2223 local delivery, resent messages may well contain it. We therefore
2224 provide an option (which defaults on) to remove any Return-path: headers
2225 on input. Removal actually means flagging as "old", which prevents the
2226 header being transmitted with the message. */
2227
2228 case htype_return_path:
2229 if (return_path_remove) h->type = htype_old;
2230
2231 /* If we are testing a mail filter file, use the value of the
2232 Return-Path: header to set up the return_path variable, which is not
2233 otherwise set. However, remove any <> that surround the address
2234 because the variable doesn't have these. */
2235
f05da2e8 2236 if (filter_test != FTEST_NONE)
059ec3d9
PH
2237 {
2238 uschar *start = h->text + 12;
2239 uschar *end = start + Ustrlen(start);
2240 while (isspace(*start)) start++;
2241 while (end > start && isspace(end[-1])) end--;
2242 if (*start == '<' && end[-1] == '>')
2243 {
2244 start++;
2245 end--;
2246 }
2247 return_path = string_copyn(start, end - start);
2248 printf("Return-path taken from \"Return-path:\" header line\n");
2249 }
2250 break;
2251
2252 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
2253 and from an untrusted caller and suppress_local_fixups is not set, or if we
2254 are in submission mode for a remote message, mark it "old" so that it will
2255 not be transmitted with the message, unless active_local_sender_retain is
2256 set. (This can only be true if active_local_from_check is false.) If there
2257 are any resent- headers in the message, apply this rule to Resent-Sender:
2258 instead of Sender:. Messages with multiple resent- header sets cannot be
2259 tidily handled. (For this reason, at least one MUA - Pine - turns old
2260 resent- headers into X-resent- headers when resending, leaving just one
2261 set.) */
059ec3d9
PH
2262
2263 case htype_sender:
69358f02 2264 h->type = ((!active_local_sender_retain &&
8800895a
PH
2265 (
2266 (sender_local && !trusted_caller && !suppress_local_fixups)
2267 || submission_mode
2268 )
059ec3d9
PH
2269 ) &&
2270 (!resents_exist||is_resent))?
2271 htype_old : htype_sender;
2272 break;
2273
2274 /* Remember the Subject: header for logging. There is no Resent-Subject */
2275
2276 case htype_subject:
2277 subject_header = h;
2278 break;
2279
2280 /* "To:" gets flagged, and the existence of a recipient header is noted,
2281 whether it's resent- or not. */
2282
2283 case htype_to:
2284 h->type = htype_to;
2285 /****
2286 to_or_cc_header_exists = TRUE;
2287 ****/
2288 break;
2289 }
2290 }
2291
2292/* Extract recipients from the headers if that is required (the -t option).
2293Note that this is documented as being done *before* any address rewriting takes
2294place. There are two possibilities:
2295
2296(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2297recipients already listed are to be REMOVED from the message. Smail 3 works
2298like this. We need to build a non-recipients tree for that list, because in
2299subsequent processing this data is held in a tree and that's what the
2300spool_write_header() function expects. Make sure that non-recipient addresses
2301are fully qualified and rewritten if necessary.
2302
2303(2) According to other sendmail documentation, -t ADDS extracted recipients to
2304those in the command line arguments (and it is rumoured some other MTAs do
2305this). Therefore, there is an option to make Exim behave this way.
2306
2307*** Notes on "Resent-" header lines ***
2308
2309The presence of resent-headers in the message makes -t horribly ambiguous.
2310Experiments with sendmail showed that it uses recipients for all resent-
2311headers, totally ignoring the concept of "sets of resent- headers" as described
2312in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2313with all the addresses in one instance of each header.
2314
2315This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2316error for -t if there were resent- headers in the message. However, after a
2317discussion on the mailing list, I've learned that there are MUAs that use
2318resent- headers with -t, and also that the stuff about sets of resent- headers
2319and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2320message with -t and resent- header lines makes sure that only *its* resent-
2321headers are present; previous ones are often renamed as X-resent- for example.
2322
2323Consequently, Exim has been changed so that, if any resent- header lines are
2324present, the recipients are taken from all of the appropriate resent- lines,
2325and not from the ordinary To:, Cc:, etc. */
2326
2327if (extract_recip)
2328 {
2329 int rcount = 0;
2330 error_block **bnext = &bad_addresses;
2331
2332 if (extract_addresses_remove_arguments)
2333 {
2334 while (recipients_count-- > 0)
2335 {
2336 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2337 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2338 tree_add_nonrecipient(s);
2339 }
2340 recipients_list = NULL;
2341 recipients_count = recipients_list_max = 0;
2342 }
2343
059ec3d9
PH
2344 /* Now scan the headers */
2345
2346 for (h = header_list->next; h != NULL; h = h->next)
2347 {
2348 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2349 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2350 {
2351 uschar *s = Ustrchr(h->text, ':') + 1;
2352 while (isspace(*s)) s++;
2353
1eccaa59
PH
2354 parse_allow_group = TRUE; /* Allow address group syntax */
2355
059ec3d9
PH
2356 while (*s != 0)
2357 {
2358 uschar *ss = parse_find_address_end(s, FALSE);
2359 uschar *recipient, *errmess, *p, *pp;
2360 int start, end, domain;
2361
2362 /* Check on maximum */
2363
2364 if (recipients_max > 0 && ++rcount > recipients_max)
2365 {
2366 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2367 US"message rejected: ", error_rc, stdin, NULL);
2368 /* Does not return */
2369 }
2370
2371 /* Make a copy of the address, and remove any internal newlines. These
2372 may be present as a result of continuations of the header line. The
2373 white space that follows the newline must not be removed - it is part
2374 of the header. */
2375
2376 pp = recipient = store_get(ss - s + 1);
2377 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2378 *pp = 0;
250b6871 2379
8c5d388a 2380#ifdef SUPPORT_I18N
250b6871
JH
2381 {
2382 BOOL b = allow_utf8_domains;
2383 allow_utf8_domains = TRUE;
2384#endif
059ec3d9
PH
2385 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2386 &domain, FALSE);
2387
8c5d388a 2388#ifdef SUPPORT_I18N
250b6871
JH
2389 if (string_is_utf8(recipient))
2390 message_smtputf8 = TRUE;
2391 else
2392 allow_utf8_domains = b;
2393 }
2394#endif
2395
059ec3d9
PH
2396 /* Keep a list of all the bad addresses so we can send a single
2397 error message at the end. However, an empty address is not an error;
2398 just ignore it. This can come from an empty group list like
2399
2400 To: Recipients of list:;
2401
2402 If there are no recipients at all, an error will occur later. */
2403
2404 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2405 {
2406 int len = Ustrlen(s);
2407 error_block *b = store_get(sizeof(error_block));
2408 while (len > 0 && isspace(s[len-1])) len--;
2409 b->next = NULL;
2410 b->text1 = string_printing(string_copyn(s, len));
2411 b->text2 = errmess;
2412 *bnext = b;
2413 bnext = &(b->next);
2414 }
2415
2416 /* If the recipient is already in the nonrecipients tree, it must
2417 have appeared on the command line with the option extract_addresses_
2418 remove_arguments set. Do not add it to the recipients, and keep a note
2419 that this has happened, in order to give a better error if there are
2420 no recipients left. */
2421
2422 else if (recipient != NULL)
2423 {
2424 if (tree_search(tree_nonrecipients, recipient) == NULL)
2425 receive_add_recipient(recipient, -1);
2426 else
2427 extracted_ignored = TRUE;
2428 }
2429
2430 /* Move on past this address */
2431
2432 s = ss + (*ss? 1:0);
2433 while (isspace(*s)) s++;
1eccaa59
PH
2434 } /* Next address */
2435
2436 parse_allow_group = FALSE; /* Reset group syntax flags */
2437 parse_found_group = FALSE;
059ec3d9
PH
2438
2439 /* If this was the bcc: header, mark it "old", which means it
2440 will be kept on the spool, but not transmitted as part of the
2441 message. */
2442
2cbb4081 2443 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2444 } /* For appropriate header line */
2445 } /* For each header line */
2446
059ec3d9
PH
2447 }
2448
2449/* Now build the unique message id. This has changed several times over the
2450lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2451Retaining all the history in the comment has become too unwieldy - read
2452previous release sources if you want it.
2453
2454The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2455The first part is the current time, in seconds. The second part is the current
2456pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2457can hold a number in the range 0-3843. It used to be a computed sequence
2458number, but is now the fractional component of the current time in units of
24591/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2460received, Exim ensures that the timer has ticked at the appropriate level
2461before proceeding, to avoid duplication if the pid happened to be re-used
2462within the same time period. It seems likely that most messages will take at
2463least half a millisecond to be received, so no delay will normally be
2464necessary. At least for some time...
2465
2466There is a modification when localhost_number is set. Formerly this was allowed
2467to be as large as 255. Now it is restricted to the range 0-16, and the final
2468component of the message id becomes (localhost_number * 200) + fractional time
2469in units of 1/200 of a second (i.e. a value in the range 0-3399).
2470
2471Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2472Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2473still allows the tttttt field to hold a large enough number to last for some
2474more decades, and the final two-digit field can hold numbers up to 1295, which
2475is enough for milliseconds (instead of 1/2000 of a second).
2476
2477However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2478pid, so it is probably safe because pids have to be positive. The
2479localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2480final field becomes (localhost_number * 100) + fractional time in centiseconds.
2481
2482Note that string_base62() returns its data in a static storage block, so it
2483must be copied before calling string_base62() again. It always returns exactly
24846 characters.
2485
2486There doesn't seem to be anything in the RFC which requires a message id to
2487start with a letter, but Smail was changed to ensure this. The external form of
2488the message id (as supplied by string expansion) therefore starts with an
2489additional leading 'E'. The spool file names do not include this leading
2490letter and it is not used internally.
2491
2492NOTE: If ever the format of message ids is changed, the regular expression for
2493checking that a string is in this format must be updated in a corresponding
2494way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2495must also be changed to reflect the correct string length. Then, of course,
2496other programs that rely on the message id format will need updating too. */
2497
2498Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2499message_id[6] = '-';
2500Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2501
2502/* Deal with the case where the host number is set. The value of the number was
2503checked when it was read, to ensure it isn't too big. The timing granularity is
2504left in id_resolution so that an appropriate wait can be done after receiving
2505the message, if necessary (we hope it won't be). */
2506
2507if (host_number_string != NULL)
2508 {
2509 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2510 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2511 string_base62((long int)(
2512 host_number * (1000000/id_resolution) +
2513 message_id_tv.tv_usec/id_resolution)) + 4);
2514 }
2515
2516/* Host number not set: final field is just the fractional time at an
2517appropriate resolution. */
2518
2519else
2520 {
2521 id_resolution = (BASE_62 == 62)? 500 : 1000;
2522 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2523 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2524 }
2525
2526/* Add the current message id onto the current process info string if
2527it will fit. */
2528
2529(void)string_format(process_info + process_info_len,
2530 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2531
2532/* If we are using multiple input directories, set up the one for this message
2533to be the least significant base-62 digit of the time of arrival. Otherwise
2534ensure that it is an empty string. */
2535
a2da3176 2536message_subdir[0] = split_spool_directory ? message_id[5] : 0;
059ec3d9
PH
2537
2538/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2539one, but only for local (without suppress_local_fixups) or submission mode
2540messages. This can be user-configured if required, but we had better flatten
2541any illegal characters therein. */
059ec3d9 2542
8800895a
PH
2543if (msgid_header == NULL &&
2544 ((sender_host_address == NULL && !suppress_local_fixups)
2545 || submission_mode))
059ec3d9
PH
2546 {
2547 uschar *p;
2548 uschar *id_text = US"";
2549 uschar *id_domain = primary_hostname;
2550
2551 /* Permit only letters, digits, dots, and hyphens in the domain */
2552
2553 if (message_id_domain != NULL)
2554 {
2555 uschar *new_id_domain = expand_string(message_id_domain);
2556 if (new_id_domain == NULL)
2557 {
2558 if (!expand_string_forcedfail)
2559 log_write(0, LOG_MAIN|LOG_PANIC,
2560 "expansion of \"%s\" (message_id_header_domain) "
2561 "failed: %s", message_id_domain, expand_string_message);
2562 }
2563 else if (*new_id_domain != 0)
2564 {
2565 id_domain = new_id_domain;
2566 for (p = id_domain; *p != 0; p++)
2567 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2568 }
2569 }
2570
2571 /* Permit all characters except controls and RFC 2822 specials in the
2572 additional text part. */
2573
2574 if (message_id_text != NULL)
2575 {
2576 uschar *new_id_text = expand_string(message_id_text);
2577 if (new_id_text == NULL)
2578 {
2579 if (!expand_string_forcedfail)
2580 log_write(0, LOG_MAIN|LOG_PANIC,
2581 "expansion of \"%s\" (message_id_header_text) "
2582 "failed: %s", message_id_text, expand_string_message);
2583 }
2584 else if (*new_id_text != 0)
2585 {
2586 id_text = new_id_text;
2587 for (p = id_text; *p != 0; p++)
2588 if (mac_iscntrl_or_special(*p)) *p = '-';
2589 }
2590 }
2591
e7e680d6
PP
2592 /* Add the header line
2593 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2594 * appended, to preserve classical expectations of header ordering. */
059ec3d9 2595
e7e680d6 2596 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
5eb690a1
NM
2597 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2598 (*id_text == 0)? "" : ".", id_text, id_domain);
059ec3d9
PH
2599 }
2600
2601/* If we are to log recipients, keep a copy of the raw ones before any possible
2602rewriting. Must copy the count, because later ACLs and the local_scan()
2603function may mess with the real recipients. */
2604
6c6d6e48 2605if (LOGGING(received_recipients))
059ec3d9
PH
2606 {
2607 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2608 for (i = 0; i < recipients_count; i++)
2609 raw_recipients[i] = string_copy(recipients_list[i].address);
2610 raw_recipients_count = recipients_count;
2611 }
2612
2613/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2614recipients will get here only if the conditions were right (allow_unqualified_
2615recipient is TRUE). */
2616
2617for (i = 0; i < recipients_count; i++)
2618 recipients_list[i].address =
2619 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2620 global_rewrite_rules, rewrite_existflags);
2621
8800895a
PH
2622/* If there is no From: header, generate one for local (without
2623suppress_local_fixups) or submission_mode messages. If there is no sender
2624address, but the sender is local or this is a local delivery error, use the
2625originator login. This shouldn't happen for genuine bounces, but might happen
2626for autoreplies. The addition of From: must be done *before* checking for the
2627possible addition of a Sender: header, because untrusted_set_sender allows an
2628untrusted user to set anything in the envelope (which might then get info
2629From:) but we still want to ensure a valid Sender: if it is required. */
2630
2631if (from_header == NULL &&
2632 ((sender_host_address == NULL && !suppress_local_fixups)
2633 || submission_mode))
059ec3d9 2634 {
2fe1a124
PH
2635 uschar *oname = US"";
2636
2637 /* Use the originator_name if this is a locally submitted message and the
2638 caller is not trusted. For trusted callers, use it only if -F was used to
2639 force its value or if we have a non-SMTP message for which -f was not used
2640 to set the sender. */
2641
2642 if (sender_host_address == NULL)
2643 {
2644 if (!trusted_caller || sender_name_forced ||
2645 (!smtp_input && !sender_address_forced))
2646 oname = originator_name;
2647 }
2648
2649 /* For non-locally submitted messages, the only time we use the originator
2650 name is when it was forced by the /name= option on control=submission. */
2651
2652 else
2653 {
2654 if (submission_name != NULL) oname = submission_name;
2655 }
2656
059ec3d9
PH
2657 /* Envelope sender is empty */
2658
2659 if (sender_address[0] == 0)
2660 {
87ba3f5f
PH
2661 uschar *fromstart, *fromend;
2662
2663 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2664 oname, (oname[0] == 0)? "" : " <");
2665 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2666
059ec3d9
PH
2667 if (sender_local || local_error_message)
2668 {
87ba3f5f
PH
2669 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2670 local_part_quote(originator_login), qualify_domain_sender,
2671 fromend);
059ec3d9
PH
2672 }
2673 else if (submission_mode && authenticated_id != NULL)
2674 {
2675 if (submission_domain == NULL)
2676 {
87ba3f5f
PH
2677 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2678 local_part_quote(authenticated_id), qualify_domain_sender,
2679 fromend);
059ec3d9
PH
2680 }
2681 else if (submission_domain[0] == 0) /* empty => whole address set */
2682 {
87ba3f5f
PH
2683 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2684 fromend);
059ec3d9
PH
2685 }
2686 else
2687 {
87ba3f5f
PH
2688 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2689 local_part_quote(authenticated_id), submission_domain,
2690 fromend);
059ec3d9
PH
2691 }
2692 from_header = header_last; /* To get it checked for Sender: */
2693 }
2694 }
2695
2696 /* There is a non-null envelope sender. Build the header using the original
2697 sender address, before any rewriting that might have been done while
2698 verifying it. */
2699
2700 else
2701 {
87ba3f5f 2702 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2703 oname,
2704 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2705 (sender_address_unrewritten == NULL)?
2706 sender_address : sender_address_unrewritten,
2fe1a124 2707 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2708
2709 from_header = header_last; /* To get it checked for Sender: */
2710 }
2711 }
2712
2713
8800895a
PH
2714/* If the sender is local (without suppress_local_fixups), or if we are in
2715submission mode and there is an authenticated_id, check that an existing From:
2716is correct, and if not, generate a Sender: header, unless disabled. Any
2717previously-existing Sender: header was removed above. Note that sender_local,
2718as well as being TRUE if the caller of exim is not trusted, is also true if a
2719trusted caller did not supply a -f argument for non-smtp input. To allow
2720trusted callers to forge From: without supplying -f, we have to test explicitly
2721here. If the From: header contains more than one address, then the call to
2722parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2723
2724if (from_header != NULL &&
69358f02 2725 (active_local_from_check &&
8800895a 2726 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2727 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2728 ))
2729 {
2730 BOOL make_sender = TRUE;
2731 int start, end, domain;
2732 uschar *errmess;
2733 uschar *from_address =
2734 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2735 &start, &end, &domain, FALSE);
2736 uschar *generated_sender_address;
2737
2738 if (submission_mode)
2739 {
2740 if (submission_domain == NULL)
2741 {
2742 generated_sender_address = string_sprintf("%s@%s",
2743 local_part_quote(authenticated_id), qualify_domain_sender);
2744 }
2745 else if (submission_domain[0] == 0) /* empty => full address */
2746 {
2747 generated_sender_address = string_sprintf("%s",
2748 authenticated_id);
2749 }
2750 else
2751 {
2752 generated_sender_address = string_sprintf("%s@%s",
2753 local_part_quote(authenticated_id), submission_domain);
2754 }
2755 }
2756 else
2757 generated_sender_address = string_sprintf("%s@%s",
2758 local_part_quote(originator_login), qualify_domain_sender);
2759
2760 /* Remove permitted prefixes and suffixes from the local part of the From:
2761 address before doing the comparison with the generated sender. */
2762
2763 if (from_address != NULL)
2764 {
2765 int slen;
2766 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2767
2768 if (at != NULL) *at = 0;
2769 from_address += route_check_prefix(from_address, local_from_prefix);
2770 slen = route_check_suffix(from_address, local_from_suffix);
2771 if (slen > 0)
2772 {
2773 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2774 from_address += slen;
2775 }
2776 if (at != NULL) *at = '@';
2777
2778 if (strcmpic(generated_sender_address, from_address) == 0 ||
2779 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2780 make_sender = FALSE;
2781 }
2782
2783 /* We have to cause the Sender header to be rewritten if there are
2784 appropriate rewriting rules. */
2785
2786 if (make_sender)
2787 {
2fe1a124 2788 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2789 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2790 generated_sender_address);
2791 else
2792 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2793 resent_prefix,
2794 submission_mode? submission_name : originator_name,
2795 generated_sender_address);
059ec3d9 2796 }
87ba3f5f
PH
2797
2798 /* Ensure that a non-null envelope sender address corresponds to the
2799 submission mode sender address. */
2800
2801 if (submission_mode && sender_address[0] != 0)
2802 {
2803 if (sender_address_unrewritten == NULL)
2804 sender_address_unrewritten = sender_address;
2805 sender_address = generated_sender_address;
089793a4
TF
2806 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2807 log_write(L_address_rewrite, LOG_MAIN,
2808 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2809 sender_address_unrewritten, generated_sender_address);
87ba3f5f 2810 }
059ec3d9
PH
2811 }
2812
059ec3d9
PH
2813/* If there are any rewriting rules, apply them to the sender address, unless
2814it has already been rewritten as part of verification for SMTP input. */
2815
2816if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2817 sender_address[0] != 0)
2818 {
2819 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2820 global_rewrite_rules, rewrite_existflags);
2821 DEBUG(D_receive|D_rewrite)
2822 debug_printf("rewritten sender = %s\n", sender_address);
2823 }
2824
2825
2826/* The headers must be run through rewrite_header(), because it ensures that
2827addresses are fully qualified, as well as applying any rewriting rules that may
2828exist.
2829
2830Qualification of header addresses in a message from a remote host happens only
2831if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2832appropriate. For local messages, qualification always happens, unless -bnq is
2833used to explicitly suppress it. No rewriting is done for an unqualified address
2834that is left untouched.
2835
2836We start at the second header, skipping our own Received:. This rewriting is
2837documented as happening *after* recipient addresses are taken from the headers
2838by the -t command line option. An added Sender: gets rewritten here. */
2839
2840for (h = header_list->next; h != NULL; h = h->next)
2841 {
2842 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2843 rewrite_existflags, TRUE);
2844 if (newh != NULL) h = newh;
2845 }
2846
2847
2848/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2849"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2850"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2851exists, this applies to the set of resent- headers rather than the normal set.
2852
2cbb4081
PH
2853The requirement for a recipient header has been removed in RFC 2822. At this
2854point in the code, earlier versions of Exim added a To: header for locally
2855submitted messages, and an empty Bcc: header for others. In the light of the
2856changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2857
059ec3d9
PH
2858
2859/* If there is no date header, generate one if the message originates locally
8800895a
PH
2860(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2861submission mode flag is set. Messages without Date: are not valid, but it seems
e7e680d6
PP
2862to be more confusing if Exim adds one to all remotely-originated messages.
2863As per Message-Id, we prepend if resending, else append.
2864*/
059ec3d9 2865
8800895a
PH
2866if (!date_header_exists &&
2867 ((sender_host_address == NULL && !suppress_local_fixups)
2868 || submission_mode))
e7e680d6
PP
2869 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2870 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
059ec3d9
PH
2871
2872search_tidyup(); /* Free any cached resources */
2873
2874/* Show the complete set of headers if debugging. Note that the first one (the
2875new Received:) has not yet been set. */
2876
2877DEBUG(D_receive)
2878 {
2879 debug_printf(">>Headers after rewriting and local additions:\n");
2880 for (h = header_list->next; h != NULL; h = h->next)
2881 debug_printf("%c %s", h->type, h->text);
2882 debug_printf("\n");
2883 }
2884
2885/* The headers are now complete in store. If we are running in filter
2886testing mode, that is all this function does. Return TRUE if the message
2887ended with a dot. */
2888
f05da2e8 2889if (filter_test != FTEST_NONE)
059ec3d9
PH
2890 {
2891 process_info[process_info_len] = 0;
2892 return message_ended == END_DOT;
2893 }
2894
7e3ce68e
JH
2895/*XXX CHUNKING: need to cancel cutthrough under BDAT, for now. In future,
2896think more if it could be handled. Cannot do onward CHUNKING unless
2897inbound is, but inbound chunking ought to be ok with outbound plain.
2898Could we do onward CHUNKING given inbound CHUNKING?
2899*/
2900if (chunking_state > CHUNKING_OFFERED)
2901 cancel_cutthrough_connection("chunking active");
2902
817d9f57 2903/* Cutthrough delivery:
5032d1cf
JH
2904We have to create the Received header now rather than at the end of reception,
2905so the timestamp behaviour is a change to the normal case.
2906XXX Ensure this gets documented XXX.
2907Having created it, send the headers to the destination. */
2908if (cutthrough.fd >= 0)
e4bdf652 2909 {
817d9f57
JH
2910 if (received_count > received_headers_max)
2911 {
2e5b33cd 2912 cancel_cutthrough_connection("too many headers");
817d9f57
JH
2913 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2914 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2915 "Too many \"Received\" headers",
2916 sender_address,
2917 (sender_fullhost == NULL)? "" : " H=",
2918 (sender_fullhost == NULL)? US"" : sender_fullhost,
2919 (sender_ident == NULL)? "" : " U=",
2920 (sender_ident == NULL)? US"" : sender_ident);
2921 message_id[0] = 0; /* Indicate no message accepted */
2922 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2923 goto TIDYUP; /* Skip to end of function */
2924 }
e4bdf652 2925 received_header_gen();
578d43dc 2926 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652
JH
2927 (void) cutthrough_headers_send();
2928 }
61147df4 2929
e4bdf652 2930
059ec3d9
PH
2931/* Open a new spool file for the data portion of the message. We need
2932to access it both via a file descriptor and a stream. Try to make the
41313d92 2933directory if it isn't there. */
059ec3d9 2934
41313d92 2935spool_name = spool_fname(US"input", message_subdir, message_id, US"-D");
a2da3176
JH
2936DEBUG(D_receive) debug_printf("Data file name: %s\n", spool_name);
2937
2938if ((data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE)) < 0)
059ec3d9
PH
2939 {
2940 if (errno == ENOENT)
2941 {
0971ec06 2942 (void) directory_make(spool_directory,
41313d92
JH
2943 spool_sname(US"input", message_subdir),
2944 INPUT_DIRECTORY_MODE, TRUE);
059ec3d9
PH
2945 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2946 }
2947 if (data_fd < 0)
2948 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2949 spool_name, strerror(errno));
2950 }
2951
2952/* Make sure the file's group is the Exim gid, and double-check the mode
2953because the group setting doesn't always get set automatically. */
2954
1ac6b2e7
JH
2955if (fchown(data_fd, exim_uid, exim_gid))
2956 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2957 "Failed setting ownership on spool file %s: %s",
2958 spool_name, strerror(errno));
ff790e47 2959(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2960
2961/* We now have data file open. Build a stream for it and lock it. We lock only
2962the first line of the file (containing the message ID) because otherwise there
2963are problems when Exim is run under Cygwin (I'm told). See comments in
2964spool_in.c, where the same locking is done. */
2965
2966data_file = fdopen(data_fd, "w+");
2967lock_data.l_type = F_WRLCK;
2968lock_data.l_whence = SEEK_SET;
2969lock_data.l_start = 0;
2970lock_data.l_len = SPOOL_DATA_START_OFFSET;
2971
2972if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2973 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2974 errno, strerror(errno));
2975
2976/* We have an open, locked data file. Write the message id to it to make it
2977self-identifying. Then read the remainder of the input of this message and
2978write it to the data file. If the variable next != NULL, it contains the first
2979data line (which was read as a header but then turned out not to have the right
2980format); write it (remembering that it might contain binary zeros). The result
2981of fwrite() isn't inspected; instead we call ferror() below. */
2982
2983fprintf(data_file, "%s-D\n", message_id);
2984if (next != NULL)
2985 {
2986 uschar *s = next->text;
2987 int len = next->slen;
1ac6b2e7 2988 len = fwrite(s, 1, len, data_file); len = len; /* compiler quietening */
059ec3d9
PH
2989 body_linecount++; /* Assumes only 1 line */
2990 }
2991
2992/* Note that we might already be at end of file, or the logical end of file
2993(indicated by '.'), or might have encountered an error while writing the
2994message id or "next" line. */
2995
2996if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2997 {
2998 if (smtp_input)
2999 {
7e3ce68e
JH
3000 message_ended = chunking_state > CHUNKING_OFFERED
3001 ? read_message_bdat_smtp(data_file)
3002 : read_message_data_smtp(data_file);
059ec3d9
PH
3003 receive_linecount++; /* The terminating "." line */
3004 }
3005 else message_ended = read_message_data(data_file);
3006
3007 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 3008 message_linecount += body_linecount;
059ec3d9 3009
7e3ce68e 3010 switch (message_ended)
059ec3d9 3011 {
7e3ce68e 3012 /* Handle premature termination of SMTP */
059ec3d9 3013
7e3ce68e
JH
3014 case END_EOF:
3015 if (smtp_input)
3016 {
3017 Uunlink(spool_name); /* Lose data file when closed */
3018 cancel_cutthrough_connection("sender closed connection");
3019 message_id[0] = 0; /* Indicate no message accepted */
3020 smtp_reply = handle_lost_connection(US"");
3021 smtp_yield = FALSE;
3022 goto TIDYUP; /* Skip to end of function */
3023 }
3024 break;
059ec3d9 3025
7e3ce68e
JH
3026 /* Handle message that is too big. Don't use host_or_ident() in the log
3027 message; we want to see the ident value even for non-remote messages. */
059ec3d9 3028
7e3ce68e
JH
3029 case END_SIZE:
3030 Uunlink(spool_name); /* Lose the data file when closed */
3031 cancel_cutthrough_connection("mail too big");
3032 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
059ec3d9 3033
7e3ce68e
JH
3034 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
3035 "message too big: read=%d max=%d",
3036 sender_address,
3037 (sender_fullhost == NULL)? "" : " H=",
3038 (sender_fullhost == NULL)? US"" : sender_fullhost,
3039 (sender_ident == NULL)? "" : " U=",
3040 (sender_ident == NULL)? US"" : sender_ident,
3041 message_size,
3042 thismessage_size_limit);
3043
3044 if (smtp_input)
3045 {
3046 smtp_reply = US"552 Message size exceeds maximum permitted";
3047 message_id[0] = 0; /* Indicate no message accepted */
3048 goto TIDYUP; /* Skip to end of function */
3049 }
3050 else
3051 {
3052 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3053 give_local_error(ERRMESS_TOOBIG,
3054 string_sprintf("message too big (max=%d)", thismessage_size_limit),
3055 US"message rejected: ", error_rc, data_file, header_list);
3056 /* Does not return */
3057 }
3058 break;
3059
3060 /* Handle bad BDAT protocol sequence */
3061
3062 case END_PROTOCOL:
3063 Uunlink(spool_name); /* Lose the data file when closed */
3064 cancel_cutthrough_connection("sender protocol error");
3065 smtp_reply = US""; /* Response already sent */
3066 message_id[0] = 0; /* Indicate no message accepted */
3067 goto TIDYUP; /* Skip to end of function */
059ec3d9
PH
3068 }
3069 }
3070
3071/* Restore the standard SIGALRM handler for any subsequent processing. (For
3072example, there may be some expansion in an ACL that uses a timer.) */
3073
3074os_non_restarting_signal(SIGALRM, sigalrm_handler);
3075
3076/* The message body has now been read into the data file. Call fflush() to
3077empty the buffers in C, and then call fsync() to get the data written out onto
3078the disk, as fflush() doesn't do this (or at least, it isn't documented as
3079having to do this). If there was an I/O error on either input or output,
3080attempt to send an error message, and unlink the spool file. For non-SMTP input
3081we can then give up. Note that for SMTP input we must swallow the remainder of
3082the input in cases of output errors, since the far end doesn't expect to see
3083anything until the terminating dot line is sent. */
3084
3085if (fflush(data_file) == EOF || ferror(data_file) ||
54fc8428 3086 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
059ec3d9
PH
3087 {
3088 uschar *msg_errno = US strerror(errno);
3089 BOOL input_error = (receive_ferror)() != 0;
3090 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
3091 input_error? "Input read" : "Spool write",
3092 msg_errno,
3093 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
3094
3095 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
3096 Uunlink(spool_name); /* Lose the data file */
2e5b33cd 3097 cancel_cutthrough_connection("error writing spoolfile");
059ec3d9
PH
3098
3099 if (smtp_input)
3100 {
3101 if (input_error)
3102 smtp_reply = US"451 Error while reading input data";
3103 else
3104 {
3105 smtp_reply = US"451 Error while writing spool file";
3106 receive_swallow_smtp();
3107 }
3108 message_id[0] = 0; /* Indicate no message accepted */
3109 goto TIDYUP; /* Skip to end of function */
3110 }
3111
3112 else
3113 {
3114 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3115 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
3116 header_list);
3117 /* Does not return */
3118 }
3119 }
3120
3121
3122/* No I/O errors were encountered while writing the data file. */
3123
3124DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
3125
3126
3127/* If there were any bad addresses extracted by -t, or there were no recipients
3128left after -t, send a message to the sender of this message, or write it to
3129stderr if the error handling option is set that way. Note that there may
3130legitimately be no recipients for an SMTP message if they have all been removed
3131by "discard".
3132
3133We need to rewind the data file in order to read it. In the case of no
3134recipients or stderr error writing, throw the data file away afterwards, and
3135exit. (This can't be SMTP, which always ensures there's at least one
3136syntactically good recipient address.) */
3137
3138if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
3139 {
3140 DEBUG(D_receive)
3141 {
3142 if (recipients_count == 0) debug_printf("*** No recipients\n");
3143 if (bad_addresses != NULL)
3144 {
3145 error_block *eblock = bad_addresses;
3146 debug_printf("*** Bad address(es)\n");
3147 while (eblock != NULL)
3148 {
3149 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
3150 eblock = eblock->next;
3151 }
3152 }
3153 }
3154
3155 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3156
3157 /* If configured to send errors to the sender, but this fails, force
3158 a failure error code. We use a special one for no recipients so that it
3159 can be detected by the autoreply transport. Otherwise error_rc is set to
3160 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
3161 it is EXIT_SUCCESS. */
3162
3163 if (error_handling == ERRORS_SENDER)
3164 {
3165 if (!moan_to_sender(
3166 (bad_addresses == NULL)?
3167 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
3168 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
3169 bad_addresses, header_list, data_file, FALSE))
3170 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
3171 }
3172 else
3173 {
3174 if (bad_addresses == NULL)
3175 {
3176 if (extracted_ignored)
3177 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
3178 else
3179 fprintf(stderr, "exim: no recipients in message\n");
3180 }
3181 else
3182 {
3183 fprintf(stderr, "exim: invalid address%s",
3184 (bad_addresses->next == NULL)? ":" : "es:\n");
3185 while (bad_addresses != NULL)
3186 {
3187 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
3188 bad_addresses->text2);
3189 bad_addresses = bad_addresses->next;
3190 }
3191 }
3192 }
3193
3194 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
3195 {
3196 Uunlink(spool_name);
f1e894f3 3197 (void)fclose(data_file);
059ec3d9
PH
3198 exim_exit(error_rc);
3199 }
3200 }
3201
3202/* Data file successfully written. Generate text for the Received: header by
3203expanding the configured string, and adding a timestamp. By leaving this
3204operation till now, we ensure that the timestamp is the time that message
3205reception was completed. However, this is deliberately done before calling the
3206data ACL and local_scan().
3207
3208This Received: header may therefore be inspected by the data ACL and by code in
3209the local_scan() function. When they have run, we update the timestamp to be
3210the final time of reception.
3211
3212If there is just one recipient, set up its value in the $received_for variable
3213for use when we generate the Received: header.
3214
3215Note: the checking for too many Received: headers is handled by the delivery
3216code. */
e4bdf652 3217/*XXX eventually add excess Received: check for cutthrough case back when classifying them */
059ec3d9 3218
e4bdf652 3219if (received_header->text == NULL) /* Non-cutthrough case */
059ec3d9 3220 {
e4bdf652 3221 received_header_gen();
059ec3d9 3222
e4bdf652 3223 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
059ec3d9 3224
e4bdf652
JH
3225 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3226 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9 3227
e4bdf652
JH
3228 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3229 now, before running the DATA ACL. */
059ec3d9 3230
578d43dc 3231 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652 3232 }
817d9f57 3233else
e4bdf652
JH
3234 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3235 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9
PH
3236
3237/* If an ACL is specified for checking things at this stage of reception of a
3238message, run it, unless all the recipients were removed by "discard" in earlier
3239ACLs. That is the only case in which recipients_count can be zero at this
3240stage. Set deliver_datafile to point to the data file so that $message_body and
3241$message_body_end can be extracted if needed. Allow $recipients in expansions.
3242*/
3243
3244deliver_datafile = data_fd;
4e88a19f 3245user_msg = NULL;
059ec3d9 3246
0e20aff9
MH
3247enable_dollar_recipients = TRUE;
3248
059ec3d9 3249if (recipients_count == 0)
7e3ce68e
JH
3250 blackholed_by = recipients_discarded ? US"MAIL ACL" : US"RCPT ACL";
3251
059ec3d9
PH
3252else
3253 {
059ec3d9
PH
3254 /* Handle interactive SMTP messages */
3255
3256 if (smtp_input && !smtp_batched_input)
3257 {
8523533c 3258
80a47a2c
TK
3259#ifndef DISABLE_DKIM
3260 if (!dkim_disable_verify)
3261 {
3262 /* Finish verification, this will log individual signature results to
3263 the mainlog */
3264 dkim_exim_verify_finish();
3265
3266 /* Check if we must run the DKIM ACL */
7e3ce68e 3267 if (acl_smtp_dkim && dkim_verify_signers && *dkim_verify_signers)
80a47a2c
TK
3268 {
3269 uschar *dkim_verify_signers_expanded =
3270 expand_string(dkim_verify_signers);
7e3ce68e 3271 if (!dkim_verify_signers_expanded)
80a47a2c
TK
3272 log_write(0, LOG_MAIN|LOG_PANIC,
3273 "expansion of dkim_verify_signers option failed: %s",
3274 expand_string_message);
7e3ce68e 3275
80a47a2c
TK
3276 else
3277 {
3278 int sep = 0;
55414b25 3279 const uschar *ptr = dkim_verify_signers_expanded;
80a47a2c 3280 uschar *item = NULL;
9e5d6b55
TK
3281 uschar *seen_items = NULL;
3282 int seen_items_size = 0;
3283 int seen_items_offset = 0;
9122af94
TK
3284 /* Default to OK when no items are present */
3285 rc = OK;
7e3ce68e 3286 while ((item = string_nextinlist(&ptr, &sep, NULL, 0)))
80a47a2c 3287 {
6119d1ea 3288 /* Prevent running ACL for an empty item */
7e3ce68e 3289 if (!item || !*item) continue;
5032d1cf
JH
3290
3291 /* Only run ACL once for each domain or identity,
3292 no matter how often it appears in the expanded list. */
3293 if (seen_items)
6119d1ea 3294 {
ae9094bf 3295 uschar *seen_item = NULL;
55414b25 3296 const uschar *seen_items_list = seen_items;
5032d1cf 3297 BOOL seen_this_item = FALSE;
61147df4 3298
ae9094bf 3299 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
7e3ce68e 3300 NULL, 0)))
5032d1cf
JH
3301 if (Ustrcmp(seen_item,item) == 0)
3302 {
3303 seen_this_item = TRUE;
3304 break;
3305 }
3306
3307 if (seen_this_item)
6119d1ea
TK
3308 {
3309 DEBUG(D_receive)
5032d1cf
JH
3310 debug_printf("acl_smtp_dkim: skipping signer %s, "
3311 "already seen\n", item);
6119d1ea
TK
3312 continue;
3313 }
61147df4 3314
5032d1cf
JH
3315 seen_items = string_append(seen_items, &seen_items_size,
3316 &seen_items_offset, 1, ":");
6119d1ea
TK
3317 }
3318
5032d1cf
JH
3319 seen_items = string_append(seen_items, &seen_items_size,
3320 &seen_items_offset, 1, item);
4a73449b 3321 seen_items[seen_items_offset] = '\0';
6119d1ea
TK
3322
3323 DEBUG(D_receive)
5032d1cf
JH
3324 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n",
3325 item);
6119d1ea 3326
80a47a2c 3327 dkim_exim_acl_setup(item);
5032d1cf
JH
3328 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim,
3329 &user_msg, &log_msg);
6119d1ea
TK
3330
3331 if (rc != OK)
5032d1cf
JH
3332 {
3333 DEBUG(D_receive)
3334 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, "
3335 "skipping remaining items\n", rc, item);
3336 cancel_cutthrough_connection("dkim acl not ok");
3337 break;
3338 }
80a47a2c 3339 }
578d43dc 3340 add_acl_headers(ACL_WHERE_DKIM, US"DKIM");
80a47a2c
TK
3341 if (rc == DISCARD)
3342 {
3343 recipients_count = 0;
3344 blackholed_by = US"DKIM ACL";
3345 if (log_msg != NULL)
3346 blackhole_log_msg = string_sprintf(": %s", log_msg);
3347 }
3348 else if (rc != OK)
3349 {
3350 Uunlink(spool_name);
3351 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
85ffcba6 3352 smtp_yield = FALSE; /* No more messages after dropped connection */
80a47a2c
TK
3353 smtp_reply = US""; /* Indicate reply already sent */
3354 message_id[0] = 0; /* Indicate no message accepted */
3355 goto TIDYUP; /* Skip to end of function */
3356 }
3357 }
3358 }
3359 }
4a8ce2d8 3360#endif /* DISABLE_DKIM */
fb2274d4 3361
8523533c 3362#ifdef WITH_CONTENT_SCAN
80a47a2c
TK
3363 if (recipients_count > 0 &&
3364 acl_smtp_mime != NULL &&
54cdb463
PH
3365 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3366 goto TIDYUP;
8523533c
TK
3367#endif /* WITH_CONTENT_SCAN */
3368
4840604e
TL
3369#ifdef EXPERIMENTAL_DMARC
3370 dmarc_up = dmarc_store_data(from_header);
3371#endif /* EXPERIMENTAL_DMARC */
3372
8ccd00b1
JH
3373#ifndef DISABLE_PRDR
3374 if (prdr_requested && recipients_count > 1 && acl_smtp_data_prdr)
fd98a5c6
JH
3375 {
3376 unsigned int c;
3377 int all_pass = OK;
3378 int all_fail = FAIL;
3379
3380 smtp_printf("353 PRDR content analysis beginning\r\n");
3381 /* Loop through recipients, responses must be in same order received */
3382 for (c = 0; recipients_count > c; c++)
3383 {
3384 uschar * addr= recipients_list[c].address;
3385 uschar * msg= US"PRDR R=<%s> %s";
3386 uschar * code;
3387 DEBUG(D_receive)
3388 debug_printf("PRDR processing recipient %s (%d of %d)\n",
3389 addr, c+1, recipients_count);
3390 rc = acl_check(ACL_WHERE_PRDR, addr,
3391 acl_smtp_data_prdr, &user_msg, &log_msg);
3392
3393 /* If any recipient rejected content, indicate it in final message */
3394 all_pass |= rc;
3395 /* If all recipients rejected, indicate in final message */
3396 all_fail &= rc;
3397
3398 switch (rc)
3399 {
3400 case OK: case DISCARD: code = US"250"; break;
3401 case DEFER: code = US"450"; break;
3402 default: code = US"550"; break;
3403 }
3404 if (user_msg != NULL)
3405 smtp_user_msg(code, user_msg);
3406 else
3407 {
3408 switch (rc)
3409 {
3410 case OK: case DISCARD:
3411 msg = string_sprintf(CS msg, addr, "acceptance"); break;
3412 case DEFER:
3413 msg = string_sprintf(CS msg, addr, "temporary refusal"); break;
3414 default:
3415 msg = string_sprintf(CS msg, addr, "refusal"); break;
3416 }
3417 smtp_user_msg(code, msg);
3418 }
3419 if (log_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, log_msg);
3420 else if (user_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, user_msg);
112b6a93 3421 else log_write(0, LOG_MAIN, "%s", CS msg);
fd98a5c6
JH
3422
3423 if (rc != OK) { receive_remove_recipient(addr); c--; }
3424 }
3425 /* Set up final message, used if data acl gives OK */
3426 smtp_reply = string_sprintf("%s id=%s message %s",
3427 all_fail == FAIL ? US"550" : US"250",
3428 message_id,
3429 all_fail == FAIL
3430 ? US"rejected for all recipients"
3431 : all_pass == OK
3432 ? US"accepted"
3433 : US"accepted for some recipients");
3434 if (recipients_count == 0)
3435 {
3436 message_id[0] = 0; /* Indicate no message accepted */
3437 goto TIDYUP;
3438 }
3439 }
3440 else
3441 prdr_requested = FALSE;
8ccd00b1 3442#endif /* !DISABLE_PRDR */
fd98a5c6 3443
54cdb463
PH
3444 /* Check the recipients count again, as the MIME ACL might have changed
3445 them. */
8523533c 3446
059ec3d9
PH
3447 if (acl_smtp_data != NULL && recipients_count > 0)
3448 {
059ec3d9 3449 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
578d43dc 3450 add_acl_headers(ACL_WHERE_DATA, US"DATA");
059ec3d9
PH
3451 if (rc == DISCARD)
3452 {
3453 recipients_count = 0;
3454 blackholed_by = US"DATA ACL";
8e669ac1
PH
3455 if (log_msg != NULL)
3456 blackhole_log_msg = string_sprintf(": %s", log_msg);
2e5b33cd 3457 cancel_cutthrough_connection("data acl discard");
059ec3d9
PH
3458 }
3459 else if (rc != OK)
3460 {
3461 Uunlink(spool_name);
2e5b33cd 3462 cancel_cutthrough_connection("data acl not ok");
8523533c
TK
3463#ifdef WITH_CONTENT_SCAN
3464 unspool_mbox();
6f0c431a
PP
3465#endif
3466#ifdef EXPERIMENTAL_DCC
3467 dcc_ok = 0;
8523533c 3468#endif
059ec3d9 3469 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
85ffcba6 3470 smtp_yield = FALSE; /* No more messages after dropped connection */
059ec3d9
PH
3471 smtp_reply = US""; /* Indicate reply already sent */
3472 message_id[0] = 0; /* Indicate no message accepted */
3473 goto TIDYUP; /* Skip to end of function */
3474 }
3475 }
3476 }
3477
3478 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3479 we cannot take different actions for permanent and temporary rejections. */
3480
54cdb463 3481 else
059ec3d9 3482 {
54cdb463
PH
3483
3484#ifdef WITH_CONTENT_SCAN
3485 if (acl_not_smtp_mime != NULL &&
3486 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3487 &blackholed_by))
3488 goto TIDYUP;
3489#endif /* WITH_CONTENT_SCAN */
3490
3491 if (acl_not_smtp != NULL)
059ec3d9 3492 {
54cdb463
PH
3493 uschar *user_msg, *log_msg;
3494 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3495 if (rc == DISCARD)
059ec3d9 3496 {
54cdb463
PH
3497 recipients_count = 0;
3498 blackholed_by = US"non-SMTP ACL";
3499 if (log_msg != NULL)
3500 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 3501 }
54cdb463 3502 else if (rc != OK)
059ec3d9 3503 {
54cdb463
PH
3504 Uunlink(spool_name);
3505#ifdef WITH_CONTENT_SCAN
3506 unspool_mbox();
6f0c431a
PP
3507#endif
3508#ifdef EXPERIMENTAL_DCC
3509 dcc_ok = 0;
54cdb463 3510#endif
6ea85e9a
PH
3511 /* The ACL can specify where rejections are to be logged, possibly
3512 nowhere. The default is main and reject logs. */
3513
3514 if (log_reject_target != 0)
3515 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3516 sender_address, log_msg);
3517
54cdb463
PH
3518 if (user_msg == NULL) user_msg = US"local configuration problem";
3519 if (smtp_batched_input)
3520 {
3521 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3522 /* Does not return */
3523 }
3524 else
3525 {
3526 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3527 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3528 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3529 header_list);
3530 /* Does not return */
3531 }
059ec3d9 3532 }
578d43dc 3533 add_acl_headers(ACL_WHERE_NOTSMTP, US"non-SMTP");
059ec3d9 3534 }
059ec3d9
PH
3535 }
3536
54cdb463
PH
3537 /* The applicable ACLs have been run */
3538
059ec3d9
PH
3539 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3540 if (queue_only_policy) queued_by = US"ACL";
059ec3d9
PH
3541 }
3542
8523533c
TK
3543#ifdef WITH_CONTENT_SCAN
3544unspool_mbox();
3545#endif
3546
6a8f9482
TK
3547#ifdef EXPERIMENTAL_DCC
3548dcc_ok = 0;
3549#endif
3550
3551
059ec3d9
PH
3552/* The final check on the message is to run the scan_local() function. The
3553version supplied with Exim always accepts, but this is a hook for sysadmins to
3554supply their own checking code. The local_scan() function is run even when all
3555the recipients have been discarded. */
3556
3557lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3558
3559/* Arrange to catch crashes in local_scan(), so that the -D file gets
3560deleted, and the incident gets logged. */
3561
3562os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3563os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3564os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3565os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3566
3567DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3568 local_scan_timeout);
3569local_scan_data = NULL;
3570
3571os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3572if (local_scan_timeout > 0) alarm(local_scan_timeout);
3573rc = local_scan(data_fd, &local_scan_data);
3574alarm(0);
3575os_non_restarting_signal(SIGALRM, sigalrm_handler);
3576
0e20aff9
MH
3577enable_dollar_recipients = FALSE;
3578
059ec3d9
PH
3579store_pool = POOL_MAIN; /* In case changed */
3580DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3581 local_scan_data);
3582
3583os_non_restarting_signal(SIGSEGV, SIG_DFL);
3584os_non_restarting_signal(SIGFPE, SIG_DFL);
3585os_non_restarting_signal(SIGILL, SIG_DFL);
3586os_non_restarting_signal(SIGBUS, SIG_DFL);
3587
3588/* The length check is paranoia against some runaway code, and also because
3589(for a success return) lines in the spool file are read into big_buffer. */
3590
3591if (local_scan_data != NULL)
3592 {
3593 int len = Ustrlen(local_scan_data);
3594 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3595 local_scan_data = string_copyn(local_scan_data, len);
3596 }
3597
3598if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3599 {
58eb016e 3600 if (!deliver_freeze) /* ACL might have already frozen */
059ec3d9
PH
3601 {
3602 deliver_freeze = TRUE;
3603 deliver_frozen_at = time(NULL);
3604 frozen_by = US"local_scan()";
3605 }
3606 rc = LOCAL_SCAN_ACCEPT;
3607 }
3608else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3609 {
3610 if (!queue_only_policy) /* ACL might have already queued */
3611 {
3612 queue_only_policy = TRUE;
3613 queued_by = US"local_scan()";
3614 }
3615 rc = LOCAL_SCAN_ACCEPT;
3616 }
3617
3618/* Message accepted: remove newlines in local_scan_data because otherwise
3619the spool file gets corrupted. Ensure that all recipients are qualified. */
3620
3621if (rc == LOCAL_SCAN_ACCEPT)
3622 {
3623 if (local_scan_data != NULL)
3624 {
3625 uschar *s;
3626 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3627 }
3628 for (i = 0; i < recipients_count; i++)
3629 {
3630 recipient_item *r = recipients_list + i;
3631 r->address = rewrite_address_qualify(r->address, TRUE);
3632 if (r->errors_to != NULL)
3633 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3634 }
3635 if (recipients_count == 0 && blackholed_by == NULL)
3636 blackholed_by = US"local_scan";
3637 }
3638
3639/* Message rejected: newlines permitted in local_scan_data to generate
3640multiline SMTP responses. */
3641
3642else
3643 {
3644 uschar *istemp = US"";
3645 uschar *s = NULL;
a5bd321b 3646 uschar *smtp_code;
059ec3d9
PH
3647 int size = 0;
3648 int sptr = 0;
059ec3d9
PH
3649
3650 errmsg = local_scan_data;
3651
3652 Uunlink(spool_name); /* Cancel this message */
3653 switch(rc)
3654 {
3655 default:
3656 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3657 "rejection given", rc);
3658 goto TEMPREJECT;
3659
3660 case LOCAL_SCAN_REJECT_NOLOGHDR:
6c6d6e48 3661 BIT_CLEAR(log_selector, log_selector_size, Li_rejected_header);
059ec3d9
PH
3662 /* Fall through */
3663
3664 case LOCAL_SCAN_REJECT:
a5bd321b 3665 smtp_code = US"550";
059ec3d9
PH
3666 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3667 break;
3668
3669 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
6c6d6e48 3670 BIT_CLEAR(log_selector, log_selector_size, Li_rejected_header);
059ec3d9
PH
3671 /* Fall through */
3672
3673 case LOCAL_SCAN_TEMPREJECT:
3674 TEMPREJECT:
a5bd321b 3675 smtp_code = US"451";
059ec3d9
PH
3676 if (errmsg == NULL) errmsg = US"Temporary local problem";
3677 istemp = US"temporarily ";
3678 break;
3679 }
3680
3681 s = string_append(s, &size, &sptr, 2, US"F=",
3682 (sender_address[0] == 0)? US"<>" : sender_address);
3683 s = add_host_info_for_log(s, &size, &sptr);
3684 s[sptr] = 0;
3685
3686 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3687 s, istemp, string_printing(errmsg));
3688
3689 if (smtp_input)
3690 {
3691 if (!smtp_batched_input)
3692 {
a5bd321b 3693 smtp_respond(smtp_code, 3, TRUE, errmsg);
059ec3d9
PH
3694 message_id[0] = 0; /* Indicate no message accepted */
3695 smtp_reply = US""; /* Indicate reply already sent */
3696 goto TIDYUP; /* Skip to end of function */
3697 }
3698 else
3699 {
a5bd321b 3700 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
059ec3d9
PH
3701 /* Does not return */
3702 }
3703 }
3704 else
3705 {
3706 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3707 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3708 US"message rejected by local scan code: ", error_rc, data_file,
3709 header_list);
3710 /* Does not return */
3711 }
3712 }
3713
3714/* Reset signal handlers to ignore signals that previously would have caused
3715the message to be abandoned. */
3716
3717signal(SIGTERM, SIG_IGN);
3718signal(SIGINT, SIG_IGN);
3719
e4bdf652 3720
059ec3d9
PH
3721/* Ensure the first time flag is set in the newly-received message. */
3722
3723deliver_firsttime = TRUE;
3724
8523533c 3725#ifdef EXPERIMENTAL_BRIGHTMAIL
a2da3176
JH
3726if (bmi_run == 1)
3727 { /* rewind data file */
8523533c
TK
3728 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3729 bmi_verdicts = bmi_process_message(header_list, data_fd);
a2da3176 3730 }
8523533c
TK
3731#endif
3732
059ec3d9
PH
3733/* Update the timstamp in our Received: header to account for any time taken by
3734an ACL or by local_scan(). The new time is the time that all reception
3735processing is complete. */
3736
3737timestamp = expand_string(US"${tod_full}");
3738tslen = Ustrlen(timestamp);
3739
3740memcpy(received_header->text + received_header->slen - tslen - 1,
3741 timestamp, tslen);
3742
3743/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3744
3745if (mua_wrapper)
3746 {
3747 deliver_freeze = FALSE;
3748 queue_only_policy = FALSE;
3749 }
3750
3751/* Keep the data file open until we have written the header file, in order to
3752hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3753don't write the header file, and we unlink the data file. If writing the header
3754file fails, we have failed to accept this message. */
3755
3756if (host_checking || blackholed_by != NULL)
3757 {
3758 header_line *h;
3759 Uunlink(spool_name);
3760 msg_size = 0; /* Compute size for log line */
3761 for (h = header_list; h != NULL; h = h->next)
3762 if (h->type != '*') msg_size += h->slen;
3763 }
3764
3765/* Write the -H file */
3766
3767else
059ec3d9
PH
3768 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3769 {
3770 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3771 Uunlink(spool_name); /* Lose the data file */
3772
3773 if (smtp_input)
3774 {
3775 smtp_reply = US"451 Error in writing spool file";
3776 message_id[0] = 0; /* Indicate no message accepted */
3777 goto TIDYUP;
3778 }
3779 else
3780 {
3781 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3782 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3783 header_list);
3784 /* Does not return */
3785 }
3786 }
059ec3d9
PH
3787
3788
3789/* The message has now been successfully received. */
3790
3791receive_messagecount++;
3792
3793/* In SMTP sessions we may receive several in one connection. After each one,
3794we wait for the clock to tick at the level of message-id granularity. This is
3795so that the combination of time+pid is unique, even on systems where the pid
3796can be re-used within our time interval. We can't shorten the interval without
3797re-designing the message-id. See comments above where the message id is
3798created. This is Something For The Future. */
3799
3800message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3801exim_wait_tick(&message_id_tv, id_resolution);
3802
3803/* Add data size to written header size. We do not count the initial file name
3804that is in the file, but we do add one extra for the notional blank line that
3805precedes the data. This total differs from message_size in that it include the
3806added Received: header and any other headers that got created locally. */
3807
3808fflush(data_file);
3809fstat(data_fd, &statbuf);
3810
3811msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3812
3813/* Generate a "message received" log entry. We do this by building up a dynamic
3814string as required. Since we commonly want to add two items at a time, use a
3815macro to simplify the coding. We log the arrival of a new message while the
3816file is still locked, just in case the machine is *really* fast, and delivers
3817it first! Include any message id that is in the message - since the syntax of a
3818message id is actually an addr-spec, we can use the parse routine to canonicize
3819it. */
3820
3821size = 256;
3822sptr = 0;
3823s = store_get(size);
3824
27b9e5f4
JH
3825s = string_append(s, &size, &sptr, 2,
3826 fake_response == FAIL ? US"(= " : US"<= ",
3827 sender_address[0] == 0 ? US"<>" : sender_address);
3828if (message_reference)
059ec3d9
PH
3829 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3830
3831s = add_host_info_for_log(s, &size, &sptr);
3832
3833#ifdef SUPPORT_TLS
6c6d6e48 3834if (LOGGING(tls_cipher) && tls_in.cipher)
817d9f57 3835 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
6c6d6e48 3836if (LOGGING(tls_certificate_verified) && tls_in.cipher)
059ec3d9 3837 s = string_append(s, &size, &sptr, 2, US" CV=",
27b9e5f4 3838 tls_in.certificate_verified ? "yes":"no");
6c6d6e48 3839if (LOGGING(tls_peerdn) && tls_in.peerdn)
48ed62d9 3840 s = string_append(s, &size, &sptr, 3, US" DN=\"",
817d9f57 3841 string_printing(tls_in.peerdn), US"\"");
6c6d6e48 3842if (LOGGING(tls_sni) && tls_in.sni)
3f0945ff 3843 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
817d9f57 3844 string_printing(tls_in.sni), US"\"");
3f0945ff 3845#endif
059ec3d9 3846
8ccd00b1 3847if (sender_host_authenticated)
059ec3d9
PH
3848 {
3849 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
27b9e5f4 3850 if (authenticated_id)
c8e2fc1e 3851 {
059ec3d9 3852 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
27b9e5f4 3853 if (LOGGING(smtp_mailauth) && authenticated_sender)
c8e2fc1e
JH
3854 s = string_append(s, &size, &sptr, 2, US":", authenticated_sender);
3855 }
059ec3d9
PH
3856 }
3857
8ccd00b1 3858#ifndef DISABLE_PRDR
fd98a5c6 3859if (prdr_requested)
7e3ce68e 3860 s = string_catn(s, &size, &sptr, US" PRDR", 5);
fd98a5c6 3861#endif
8ccd00b1 3862
cee5f132 3863#ifdef SUPPORT_PROXY
6c6d6e48 3864if (proxy_session && LOGGING(proxy))
e6d2a989 3865 s = string_append(s, &size, &sptr, 2, US" PRX=", proxy_local_address);
a3c86431 3866#endif
fd98a5c6 3867
7e3ce68e
JH
3868if (chunking_state > CHUNKING_OFFERED)
3869 s = string_catn(s, &size, &sptr, US" K", 2);
3870
059ec3d9
PH
3871sprintf(CS big_buffer, "%d", msg_size);
3872s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3873
3c0a92dc
JH
3874/* log 8BITMIME mode announced in MAIL_FROM
3875 0 ... no BODY= used
3876 7 ... 7BIT
3877 8 ... 8BITMIME */
6c6d6e48 3878if (LOGGING(8bitmime))
c8e2fc1e 3879 {
3c0a92dc
JH
3880 sprintf(CS big_buffer, "%d", body_8bitmime);
3881 s = string_append(s, &size, &sptr, 2, US" M8S=", big_buffer);
c8e2fc1e 3882 }
3c0a92dc 3883
afa6d3ad
JH
3884if (*queue_name)
3885 s = string_append(s, &size, &sptr, 2, US" Q=", queue_name);
3886
059ec3d9
PH
3887/* If an addr-spec in a message-id contains a quoted string, it can contain
3888any characters except " \ and CR and so in particular it can contain NL!
3889Therefore, make sure we use a printing-characters only version for the log.
3890Also, allow for domain literals in the message id. */
3891
27b9e5f4 3892if (msgid_header)
059ec3d9
PH
3893 {
3894 uschar *old_id;
3895 BOOL save_allow_domain_literals = allow_domain_literals;
3896 allow_domain_literals = TRUE;
3897 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3898 &errmsg, &start, &end, &domain, FALSE);
3899 allow_domain_literals = save_allow_domain_literals;
3900 if (old_id != NULL)
3901 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3902 }
3903
3904/* If subject logging is turned on, create suitable printing-character
3905text. By expanding $h_subject: we make use of the MIME decoding. */
3906
6c6d6e48 3907if (LOGGING(subject) && subject_header != NULL)
059ec3d9
PH
3908 {
3909 int i;
3910 uschar *p = big_buffer;
3911 uschar *ss = expand_string(US"$h_subject:");
3912
3913 /* Backslash-quote any double quotes or backslashes so as to make a
3914 a C-like string, and turn any non-printers into escape sequences. */
3915
3916 *p++ = '\"';
3917 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3918 {
3919 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3920 *p++ = ss[i];
3921 }
3922 *p++ = '\"';
3923 *p = 0;
3924 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3925 }
3926
3927/* Terminate the string: string_cat() and string_append() leave room, but do
3928not put the zero in. */
3929
3930s[sptr] = 0;
3931
059ec3d9
PH
3932/* Create a message log file if message logs are being used and this message is
3933not blackholed. Write the reception stuff to it. We used to leave message log
e4bdf652 3934creation until the first delivery, but this has proved confusing for some
059ec3d9
PH
3935people. */
3936
3937if (message_logs && blackholed_by == NULL)
3938 {
3939 int fd;
3940
41313d92 3941 spool_name = spool_fname(US"msglog", message_subdir, message_id, US"");
a2da3176
JH
3942
3943 if ( (fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE)) < 0
3944 && errno == ENOENT
3945 )
059ec3d9 3946 {
41313d92
JH
3947 (void)directory_make(spool_directory,
3948 spool_sname(US"msglog", message_subdir),
3949 MSGLOG_DIRECTORY_MODE, TRUE);
059ec3d9
PH
3950 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3951 }
3952
3953 if (fd < 0)
3954 {
3955 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3956 spool_name, strerror(errno));
3957 }
3958
3959 else
3960 {
3961 FILE *message_log = fdopen(fd, "a");
3962 if (message_log == NULL)
3963 {
3964 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3965 spool_name, strerror(errno));
f1e894f3 3966 (void)close(fd);
059ec3d9
PH
3967 }
3968 else
3969 {
3970 uschar *now = tod_stamp(tod_log);
3971 fprintf(message_log, "%s Received from %s\n", now, s+3);
3972 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3973 frozen_by);
3974 if (queue_only_policy) fprintf(message_log,
e8012beb
JH
3975 "%s no immediate delivery: queued%s%s by %s\n", now,
3976 *queue_name ? " in " : "", *queue_name ? CS queue_name : "",
3977 queued_by);
f1e894f3 3978 (void)fclose(message_log);
059ec3d9
PH
3979 }
3980 }
3981 }
3982
58eb016e
PH
3983/* Everything has now been done for a successful message except logging its
3984arrival, and outputting an SMTP response. While writing to the log, set a flag
3985to cause a call to receive_bomb_out() if the log cannot be opened. */
3986
3987receive_call_bombout = TRUE;
3988
563b63fa
PH
3989/* Before sending an SMTP response in a TCP/IP session, we check to see if the
3990connection has gone away. This can only be done if there is no unconsumed input
3991waiting in the local input buffer. We can test for this by calling
3992receive_smtp_buffered(). RFC 2920 (pipelining) explicitly allows for additional
3993input to be sent following the final dot, so the presence of following input is
3994not an error.
58eb016e 3995
563b63fa
PH
3996If the connection is still present, but there is no unread input for the
3997socket, the result of a select() call will be zero. If, however, the connection
3998has gone away, or if there is pending input, the result of select() will be
3999non-zero. The two cases can be distinguished by trying to read the next input
4000character. If we succeed, we can unread it so that it remains in the local
4001buffer for handling later. If not, the connection has been lost.
58eb016e 4002
563b63fa
PH
4003Of course, since TCP/IP is asynchronous, there is always a chance that the
4004connection will vanish between the time of this test and the sending of the
4005response, but the chance of this happening should be small. */
4006
4007if (smtp_input && sender_host_address != NULL && !sender_host_notsocket &&
4008 !receive_smtp_buffered())
58eb016e
PH
4009 {
4010 struct timeval tv;
4011 fd_set select_check;
4012 FD_ZERO(&select_check);
4013 FD_SET(fileno(smtp_in), &select_check);
4014 tv.tv_sec = 0;
4015 tv.tv_usec = 0;
4016
563b63fa 4017 if (select(fileno(smtp_in) + 1, &select_check, NULL, NULL, &tv) != 0)
58eb016e 4018 {
80a47a2c
TK
4019 int c = (receive_getc)();
4020 if (c != EOF) (receive_ungetc)(c); else
58eb016e 4021 {
563b63fa
PH
4022 uschar *msg = US"SMTP connection lost after final dot";
4023 smtp_reply = US""; /* No attempt to send a response */
4024 smtp_yield = FALSE; /* Nothing more on this connection */
58eb016e 4025
563b63fa 4026 /* Re-use the log line workspace */
58eb016e 4027
563b63fa 4028 sptr = 0;
c2f669a4 4029 s = string_cat(s, &size, &sptr, msg);
563b63fa
PH
4030 s = add_host_info_for_log(s, &size, &sptr);
4031 s[sptr] = 0;
4032 log_write(0, LOG_MAIN, "%s", s);
58eb016e 4033
563b63fa 4034 /* Delete the files for this aborted message. */
58eb016e 4035
41313d92
JH
4036 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-D"));
4037 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-H"));
4038 Uunlink(spool_fname(US"msglog", message_subdir, message_id, US""));
58eb016e 4039
563b63fa
PH
4040 goto TIDYUP;
4041 }
58eb016e
PH
4042 }
4043 }
4044
4045/* The connection has not gone away; we really are going to take responsibility
4046for this message. */
4047
817d9f57 4048/* Cutthrough - had sender last-dot; assume we've sent (or bufferred) all
e4bdf652
JH
4049 data onward by now.
4050
817d9f57 4051 Send dot onward. If accepted, wipe the spooled files, log as delivered and accept
e4bdf652 4052 the sender's dot (below).
817d9f57
JH
4053 If rejected: copy response to sender, wipe the spooled files, log approriately.
4054 If temp-reject: accept to sender, keep the spooled files.
e4bdf652
JH
4055
4056 Having the normal spool files lets us do data-filtering, and store/forward on temp-reject.
817d9f57
JH
4057
4058 XXX We do not handle queue-only, freezing, or blackholes.
e4bdf652 4059*/
5032d1cf 4060if(cutthrough.fd >= 0)
e4bdf652 4061 {
85ffcba6 4062 uschar * msg= cutthrough_finaldot(); /* Ask the target system to accept the message */
817d9f57 4063 /* Logging was done in finaldot() */
e4bdf652 4064 switch(msg[0])
817d9f57
JH
4065 {
4066 case '2': /* Accept. Do the same to the source; dump any spoolfiles. */
b784ce7f 4067 cutthrough_done = ACCEPTED;
817d9f57 4068 break; /* message_id needed for SMTP accept below */
61147df4 4069
817d9f57
JH
4070 default: /* Unknown response, or error. Treat as temp-reject. */
4071 case '4': /* Temp-reject. Keep spoolfiles and accept. */
b784ce7f 4072 cutthrough_done = TMP_REJ; /* Avoid the usual immediate delivery attempt */
817d9f57 4073 break; /* message_id needed for SMTP accept below */
61147df4 4074
817d9f57
JH
4075 case '5': /* Perm-reject. Do the same to the source. Dump any spoolfiles */
4076 smtp_reply= msg; /* Pass on the exact error */
b784ce7f 4077 cutthrough_done = PERM_REJ;
817d9f57
JH
4078 break;
4079 }
e4bdf652 4080 }
58eb016e 4081
8ccd00b1
JH
4082#ifndef DISABLE_PRDR
4083if(!smtp_reply || prdr_requested)
4084#else
4085if(!smtp_reply)
fd98a5c6 4086#endif
e4bdf652
JH
4087 {
4088 log_write(0, LOG_MAIN |
6c6d6e48
TF
4089 (LOGGING(received_recipients)? LOG_RECIPIENTS : 0) |
4090 (LOGGING(received_sender)? LOG_SENDER : 0),
e4bdf652
JH
4091 "%s", s);
4092
4093 /* Log any control actions taken by an ACL or local_scan(). */
58eb016e 4094
e4bdf652
JH
4095 if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
4096 if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
e8012beb
JH
4097 "no immediate delivery: queued%s%s by %s",
4098 *queue_name ? " in " : "", *queue_name ? CS queue_name : "",
4099 queued_by);
e4bdf652
JH
4100 }
4101receive_call_bombout = FALSE;
58eb016e 4102
059ec3d9
PH
4103store_reset(s); /* The store for the main log message can be reused */
4104
4105/* If the message is frozen, and freeze_tell is set, do the telling. */
4106
4107if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
4108 {
4109 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
4110 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
4111 message_id, frozen_by, sender_address);
4112 }
4113
4114
4115/* Either a message has been successfully received and written to the two spool
4116files, or an error in writing the spool has occurred for an SMTP message, or
58eb016e
PH
4117an SMTP message has been rejected for policy reasons. (For a non-SMTP message
4118we will have already given up because there's no point in carrying on!) In
4119either event, we must now close (and thereby unlock) the data file. In the
059ec3d9
PH
4120successful case, this leaves the message on the spool, ready for delivery. In
4121the error case, the spool file will be deleted. Then tidy up store, interact
4122with an SMTP call if necessary, and return.
4123
4124A fflush() was done earlier in the expectation that any write errors on the
4125data file will be flushed(!) out thereby. Nevertheless, it is theoretically
4126possible for fclose() to fail - but what to do? What has happened to the lock
4127if this happens? */
4128
e4bdf652 4129
059ec3d9 4130TIDYUP:
f1e894f3
PH
4131process_info[process_info_len] = 0; /* Remove message id */
4132if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
059ec3d9
PH
4133
4134/* Now reset signal handlers to their defaults */
4135
4136signal(SIGTERM, SIG_DFL);
4137signal(SIGINT, SIG_DFL);
4138
4139/* Tell an SMTP caller the state of play, and arrange to return the SMTP return
4140value, which defaults TRUE - meaning there may be more incoming messages from
4141this connection. For non-SMTP callers (where there is only ever one message),
4142the default is FALSE. */
4143
4144if (smtp_input)
4145 {
4146 yield = smtp_yield;
4147
4148 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
58eb016e
PH
4149 is set to the response that should be sent. When it is NULL, we generate
4150 default responses. After an ACL error or local_scan() error, the response has
4151 already been sent, and smtp_reply is an empty string to indicate this. */
059ec3d9
PH
4152
4153 if (!smtp_batched_input)
4154 {
27b9e5f4 4155 if (!smtp_reply)
059ec3d9 4156 {
29aba418 4157 if (fake_response != OK)
27b9e5f4
JH
4158 smtp_respond(fake_response == DEFER ? US"450" : US"550",
4159 3, TRUE, fake_response_text);
4e88a19f
PH
4160
4161 /* An OK response is required; use "message" text if present. */
4162
27b9e5f4 4163 else if (user_msg)
4e88a19f
PH
4164 {
4165 uschar *code = US"250";
4166 int len = 3;
4f6ae5c3 4167 smtp_message_code(&code, &len, &user_msg, NULL, TRUE);
4e88a19f
PH
4168 smtp_respond(code, len, TRUE, user_msg);
4169 }
4170
4171 /* Default OK response */
4172
7e3ce68e
JH
4173 else if (chunking_state > CHUNKING_OFFERED)
4174 {
4175 smtp_printf("250- %u byte chunk, total %d\r\n250 OK id=%s\r\n",
4176 chunking_datasize, message_size+message_linecount, message_id);
4177 chunking_state = CHUNKING_OFFERED;
4178 }
8e669ac1
PH
4179 else
4180 smtp_printf("250 OK id=%s\r\n", message_id);
7e3ce68e 4181
059ec3d9
PH
4182 if (host_checking)
4183 fprintf(stdout,
4184 "\n**** SMTP testing: that is not a real message id!\n\n");
4185 }
4e88a19f 4186
58eb016e 4187 /* smtp_reply is set non-empty */
4e88a19f 4188
8523533c
TK
4189 else if (smtp_reply[0] != 0)
4190 {
29aba418 4191 if (fake_response != OK && (smtp_reply[0] == '2'))
a5bd321b
PH
4192 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4193 fake_response_text);
8e669ac1 4194 else
6951ac6c
PH
4195 smtp_printf("%.1024s\r\n", smtp_reply);
4196 }
e4bdf652 4197
817d9f57
JH
4198 switch (cutthrough_done)
4199 {
b784ce7f 4200 case ACCEPTED: log_write(0, LOG_MAIN, "Completed");/* Delivery was done */
41313d92
JH
4201 case PERM_REJ:
4202 { /* Delete spool files */
4203 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-D"));
4204 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-H"));
4205 Uunlink(spool_fname(US"msglog", message_subdir, message_id, US""));
817d9f57 4206 }
b784ce7f 4207 case TMP_REJ: message_id[0] = 0; /* Prevent a delivery from starting */
817d9f57 4208 default:break;
e4bdf652 4209 }
5032d1cf 4210 cutthrough.delivery = FALSE;
059ec3d9
PH
4211 }
4212
4213 /* For batched SMTP, generate an error message on failure, and do
4214 nothing on success. The function moan_smtp_batch() does not return -
4215 it exits from the program with a non-zero return code. */
4216
27b9e5f4
JH
4217 else if (smtp_reply)
4218 moan_smtp_batch(NULL, "%s", smtp_reply);
059ec3d9
PH
4219 }
4220
4221
4222/* If blackholing, we can immediately log this message's sad fate. The data
4223file has already been unlinked, and the header file was never written to disk.
4224We must now indicate that nothing was received, to prevent a delivery from
4225starting. */
4226
27b9e5f4 4227if (blackholed_by)
059ec3d9 4228 {
55414b25
JH
4229 const uschar *detail = local_scan_data
4230 ? string_printing(local_scan_data)
4231 : string_sprintf("(%s discarded recipients)", blackholed_by);
04f7d5b9 4232 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
059ec3d9
PH
4233 log_write(0, LOG_MAIN, "Completed");
4234 message_id[0] = 0;
4235 }
4236
4237/* Reset headers so that logging of rejects for a subsequent message doesn't
4238include them. It is also important to set header_last = NULL before exiting
4239from this function, as this prevents certain rewrites that might happen during
4240subsequent verifying (of another incoming message) from trying to add headers
4241when they shouldn't. */
4242
4243header_list = header_last = NULL;
4244
4245return yield; /* TRUE if more messages (SMTP only) */
4246}
4247
4248/* End of receive.c */