Fix buffer overrun in spam= acl condition. Bug 1552
[exim.git] / src / src / receive.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
2331cfe7 5/* Copyright (c) University of Cambridge 1995 - 2014 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Code for receiving a message and setting up spool files. */
9
059ec3d9
PH
10#include "exim.h"
11
6a8f9482
TK
12#ifdef EXPERIMENTAL_DCC
13extern int dcc_ok;
14#endif
15
4840604e 16#ifdef EXPERIMENTAL_DMARC
c007c974 17# include "dmarc.h"
4840604e
TL
18#endif /* EXPERIMENTAL_DMARC */
19
059ec3d9
PH
20/*************************************************
21* Local static variables *
22*************************************************/
23
24static FILE *data_file = NULL;
25static int data_fd = -1;
26static uschar spool_name[256];
27
28
29
30/*************************************************
31* Non-SMTP character reading functions *
32*************************************************/
33
34/* These are the default functions that are set up in the variables such as
35receive_getc initially. They just call the standard functions, passing stdin as
36the file. (When SMTP input is occurring, different functions are used by
37changing the pointer variables.) */
38
39int
40stdin_getc(void)
41{
42return getc(stdin);
43}
44
45int
46stdin_ungetc(int c)
47{
48return ungetc(c, stdin);
49}
50
51int
52stdin_feof(void)
53{
54return feof(stdin);
55}
56
57int
58stdin_ferror(void)
59{
60return ferror(stdin);
61}
62
63
64
65
66/*************************************************
67* Check that a set sender is allowed *
68*************************************************/
69
70/* This function is called when a local caller sets an explicit sender address.
71It checks whether this is permitted, which it is for trusted callers.
72Otherwise, it must match the pattern(s) in untrusted_set_sender.
73
74Arguments: the proposed sender address
75Returns: TRUE for a trusted caller
76 TRUE if the address has been set, untrusted_set_sender has been
77 set, and the address matches something in the list
78 FALSE otherwise
79*/
80
81BOOL
82receive_check_set_sender(uschar *newsender)
83{
84uschar *qnewsender;
85if (trusted_caller) return TRUE;
86if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
87qnewsender = (Ustrchr(newsender, '@') != NULL)?
88 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
89return
90 match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1,
91 0, NULL) == OK;
92}
93
94
95
96
97/*************************************************
5cb8cbc6 98* Read space info for a partition *
059ec3d9
PH
99*************************************************/
100
8e669ac1
PH
101/* This function is called by receive_check_fs() below, and also by string
102expansion for variables such as $spool_space. The field names for the statvfs
5cb8cbc6
PH
103structure are macros, because not all OS have F_FAVAIL and it seems tidier to
104have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
105have inodes, and they return -1 for the number available.
059ec3d9 106
5cb8cbc6
PH
107Later: It turns out that some file systems that do not have the concept of
108inodes return 0 rather than -1. Such systems should also return 0 for the total
8e669ac1 109number of inodes, so we require that to be greater than zero before returning
5cb8cbc6 110an inode count.
059ec3d9 111
5cb8cbc6
PH
112Arguments:
113 isspool TRUE for spool partition, FALSE for log partition
114 inodeptr address of int to receive inode count; -1 if there isn't one
8e669ac1 115
5cb8cbc6 116Returns: available on-root space, in kilobytes
8e669ac1
PH
117 -1 for log partition if there isn't one
118
119All values are -1 if the STATFS functions are not available.
059ec3d9
PH
120*/
121
8e669ac1 122int
5cb8cbc6 123receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
124{
125#ifdef HAVE_STATFS
059ec3d9 126struct STATVFS statbuf;
5cb8cbc6
PH
127uschar *path;
128uschar *name;
129uschar buffer[1024];
059ec3d9 130
5cb8cbc6 131/* The spool directory must always exist. */
059ec3d9 132
5cb8cbc6 133if (isspool)
059ec3d9 134 {
8e669ac1
PH
135 path = spool_directory;
136 name = US"spool";
137 }
138
059ec3d9
PH
139/* Need to cut down the log file path to the directory, and to ignore any
140appearance of "syslog" in it. */
141
5cb8cbc6 142else
059ec3d9 143 {
059ec3d9 144 int sep = ':'; /* Not variable - outside scripts use */
059ec3d9 145 uschar *p = log_file_path;
8e669ac1 146 name = US"log";
059ec3d9
PH
147
148 /* An empty log_file_path means "use the default". This is the same as an
149 empty item in a list. */
150
151 if (*p == 0) p = US":";
152 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL)
153 {
154 if (Ustrcmp(path, "syslog") != 0) break;
155 }
156
5cb8cbc6
PH
157 if (path == NULL) /* No log files */
158 {
8e669ac1
PH
159 *inodeptr = -1;
160 return -1;
161 }
059ec3d9 162
8e669ac1
PH
163 /* An empty string means use the default, which is in the spool directory.
164 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 165 subdirectory has been symbolically linked elsewhere. */
059ec3d9 166
8e669ac1 167 if (path[0] == 0)
059ec3d9 168 {
5cb8cbc6
PH
169 sprintf(CS buffer, CS"%s/log", CS spool_directory);
170 path = buffer;
8e669ac1
PH
171 }
172 else
059ec3d9 173 {
8e669ac1 174 uschar *cp;
5cb8cbc6 175 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 176 }
5cb8cbc6 177 }
8e669ac1 178
8f128379 179/* We now have the path; do the business */
5cb8cbc6
PH
180
181memset(&statbuf, 0, sizeof(statbuf));
182
183if (STATVFS(CS path, &statbuf) != 0)
184 {
185 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
186 "%s directory %s: %s", name, spool_directory, strerror(errno));
187 smtp_closedown(US"spool or log directory problem");
188 exim_exit(EXIT_FAILURE);
189 }
8e669ac1 190
5cb8cbc6
PH
191*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
192
193/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 194
5cb8cbc6
PH
195return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
196
197/* Unable to find partition sizes in this environment. */
198
199#else
200*inodeptr = -1;
201return -1;
202#endif
203}
204
059ec3d9 205
059ec3d9 206
5cb8cbc6
PH
207
208/*************************************************
209* Check space on spool and log partitions *
210*************************************************/
211
212/* This function is called before accepting a message; if any thresholds are
213set, it checks them. If a message_size is supplied, it checks that there is
214enough space for that size plus the threshold - i.e. that the message won't
215reduce the space to the threshold. Not all OS have statvfs(); for those that
216don't, this function always returns TRUE. For some OS the old function and
217struct name statfs is used; that is handled by a macro, defined in exim.h.
218
219Arguments:
220 msg_size the (estimated) size of an incoming message
221
222Returns: FALSE if there isn't enough space, or if the information cannot
223 be obtained
224 TRUE if no check was done or there is enough space
225*/
226
227BOOL
228receive_check_fs(int msg_size)
229{
230int space, inodes;
231
232if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
233 {
8e669ac1
PH
234 space = receive_statvfs(TRUE, &inodes);
235
059ec3d9 236 DEBUG(D_receive)
5cb8cbc6
PH
237 debug_printf("spool directory space = %dK inodes = %d "
238 "check_space = %dK inodes = %d msg_size = %d\n",
239 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
240
241 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 242 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 243 {
5cb8cbc6
PH
244 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
245 "inodes=%d", space, inodes);
059ec3d9
PH
246 return FALSE;
247 }
248 }
249
5cb8cbc6
PH
250if (check_log_space > 0 || check_log_inodes > 0)
251 {
8e669ac1
PH
252 space = receive_statvfs(FALSE, &inodes);
253
5cb8cbc6
PH
254 DEBUG(D_receive)
255 debug_printf("log directory space = %dK inodes = %d "
256 "check_space = %dK inodes = %d\n",
257 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
258
259 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 260 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 261 {
5cb8cbc6
PH
262 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
263 "inodes=%d", space, inodes);
264 return FALSE;
265 }
8e669ac1
PH
266 }
267
059ec3d9
PH
268return TRUE;
269}
270
271
272
273/*************************************************
274* Bomb out while reading a message *
275*************************************************/
276
277/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
278received, or if there is a timeout. A rarer case might be if the log files are
279screwed up and Exim can't open them to record a message's arrival. Handling
280that case is done by setting a flag to cause the log functions to call this
281function if there is an ultimate disaster. That is why it is globally
282accessible.
283
8f128379
PH
284Arguments:
285 reason text reason to pass to the not-quit ACL
286 msg default SMTP response to give if in an SMTP session
059ec3d9
PH
287Returns: it doesn't
288*/
289
290void
8f128379 291receive_bomb_out(uschar *reason, uschar *msg)
059ec3d9 292{
ead37e6c
PP
293 static BOOL already_bombing_out;
294/* The smtp_notquit_exit() below can call ACLs which can trigger recursive
295timeouts, if someone has something slow in their quit ACL. Since the only
296things we should be doing are to close down cleanly ASAP, on the second
297pass we also close down stuff that might be opened again, before bypassing
298the ACL call and exiting. */
299
059ec3d9
PH
300/* If spool_name is set, it contains the name of the data file that is being
301written. Unlink it before closing so that it cannot be picked up by a delivery
302process. Ensure that any header file is also removed. */
303
ead37e6c 304if (spool_name[0] != '\0')
059ec3d9
PH
305 {
306 Uunlink(spool_name);
307 spool_name[Ustrlen(spool_name) - 1] = 'H';
308 Uunlink(spool_name);
ead37e6c 309 spool_name[0] = '\0';
059ec3d9
PH
310 }
311
312/* Now close the file if it is open, either as a fd or a stream. */
313
ead37e6c
PP
314if (data_file != NULL)
315 {
316 (void)fclose(data_file);
317 data_file = NULL;
318} else if (data_fd >= 0) {
319 (void)close(data_fd);
320 data_fd = -1;
321 }
059ec3d9 322
8f128379
PH
323/* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
324smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
325SMTP response. */
059ec3d9 326
ead37e6c 327if (!already_bombing_out)
059ec3d9 328 {
ead37e6c
PP
329 already_bombing_out = TRUE;
330 if (smtp_input)
331 {
332 if (smtp_batched_input)
333 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
334 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
335 smtp_active_hostname, msg);
336 }
059ec3d9
PH
337 }
338
339/* Exit from the program (non-BSMTP cases) */
340
341exim_exit(EXIT_FAILURE);
342}
343
344
345/*************************************************
346* Data read timeout *
347*************************************************/
348
349/* Handler function for timeouts that occur while reading the data that
350comprises a message.
351
352Argument: the signal number
353Returns: nothing
354*/
355
356static void
357data_timeout_handler(int sig)
358{
359uschar *msg = NULL;
360
361sig = sig; /* Keep picky compilers happy */
362
363if (smtp_input)
364 {
365 msg = US"SMTP incoming data timeout";
366 log_write(L_lost_incoming_connection,
367 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
368 "from %s F=<%s>",
369 (sender_fullhost != NULL)? sender_fullhost : US"local process",
370 sender_address);
059ec3d9
PH
371 }
372else
373 {
374 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
375 log_write(L_lost_incoming_connection,
376 LOG_MAIN, "timed out while reading local message");
377 }
378
8f128379 379receive_bomb_out(US"data-timeout", msg); /* Does not return */
059ec3d9
PH
380}
381
382
383
384/*************************************************
385* local_scan() timeout *
386*************************************************/
387
388/* Handler function for timeouts that occur while running a local_scan()
389function.
390
391Argument: the signal number
392Returns: nothing
393*/
394
395static void
396local_scan_timeout_handler(int sig)
397{
398sig = sig; /* Keep picky compilers happy */
399log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
400 "message temporarily rejected (size %d)", message_size);
8f128379
PH
401/* Does not return */
402receive_bomb_out(US"local-scan-timeout", US"local verification problem");
059ec3d9
PH
403}
404
405
406
407/*************************************************
408* local_scan() crashed *
409*************************************************/
410
411/* Handler function for signals that occur while running a local_scan()
412function.
413
414Argument: the signal number
415Returns: nothing
416*/
417
418static void
419local_scan_crash_handler(int sig)
420{
421log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
422 "signal %d - message temporarily rejected (size %d)", sig, message_size);
8f128379
PH
423/* Does not return */
424receive_bomb_out(US"local-scan-error", US"local verification problem");
059ec3d9
PH
425}
426
427
428/*************************************************
429* SIGTERM or SIGINT received *
430*************************************************/
431
432/* Handler for SIGTERM or SIGINT signals that occur while reading the
433data that comprises a message.
434
435Argument: the signal number
436Returns: nothing
437*/
438
439static void
440data_sigterm_sigint_handler(int sig)
441{
442uschar *msg = NULL;
443
444if (smtp_input)
445 {
446 msg = US"Service not available - SIGTERM or SIGINT received";
447 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
448 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
449 }
450else
451 {
f05da2e8 452 if (filter_test == FTEST_NONE)
059ec3d9
PH
453 {
454 fprintf(stderr, "\nexim: %s received - message abandoned\n",
455 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
456 log_write(0, LOG_MAIN, "%s received while reading local message",
457 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
458 }
459 }
460
8f128379 461receive_bomb_out(US"signal-exit", msg); /* Does not return */
059ec3d9
PH
462}
463
464
465
466/*************************************************
467* Add new recipient to list *
468*************************************************/
469
470/* This function builds a list of recipient addresses in argc/argv
471format.
472
473Arguments:
474 recipient the next address to add to recipients_list
475 pno parent number for fixed aliases; -1 otherwise
476
477Returns: nothing
478*/
479
480void
481receive_add_recipient(uschar *recipient, int pno)
482{
483if (recipients_count >= recipients_list_max)
484 {
485 recipient_item *oldlist = recipients_list;
486 int oldmax = recipients_list_max;
487 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
488 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
489 if (oldlist != NULL)
490 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
491 }
492
493recipients_list[recipients_count].address = recipient;
494recipients_list[recipients_count].pno = pno;
8523533c
TK
495#ifdef EXPERIMENTAL_BRIGHTMAIL
496recipients_list[recipients_count].bmi_optin = bmi_current_optin;
497/* reset optin string pointer for next recipient */
498bmi_current_optin = NULL;
499#endif
6c1c3d1d
WB
500#ifdef EXPERIMENTAL_DSN
501recipients_list[recipients_count].orcpt = NULL;
502recipients_list[recipients_count].dsn_flags = 0;
503#endif
059ec3d9
PH
504recipients_list[recipients_count++].errors_to = NULL;
505}
506
507
508
509
fd98a5c6
JH
510/*************************************************
511* Send user response message *
512*************************************************/
61147df4 513
fd98a5c6
JH
514/* This function is passed a default response code and a user message. It calls
515smtp_message_code() to check and possibly modify the response code, and then
516calls smtp_respond() to transmit the response. I put this into a function
517just to avoid a lot of repetition.
61147df4
PP
518
519Arguments:
fd98a5c6
JH
520 code the response code
521 user_msg the user message
522
523Returns: nothing
61147df4
PP
524*/
525
8ccd00b1 526#ifndef DISABLE_PRDR
61147df4 527static void
fd98a5c6 528smtp_user_msg(uschar *code, uschar *user_msg)
61147df4 529{
fd98a5c6
JH
530int len = 3;
531smtp_message_code(&code, &len, &user_msg, NULL);
532smtp_respond(code, len, TRUE, user_msg);
61147df4
PP
533}
534#endif
535
536
537
538
fd98a5c6 539
059ec3d9
PH
540/*************************************************
541* Remove a recipient from the list *
542*************************************************/
543
544/* This function is provided for local_scan() to use.
545
546Argument:
547 recipient address to remove
548
549Returns: TRUE if it did remove something; FALSE otherwise
550*/
551
552BOOL
553receive_remove_recipient(uschar *recipient)
554{
555int count;
556DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
557 recipient);
558for (count = 0; count < recipients_count; count++)
559 {
560 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
561 {
562 if ((--recipients_count - count) > 0)
563 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 564 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
565 return TRUE;
566 }
567 }
568return FALSE;
569}
570
571
572
573
574
575/*************************************************
576* Read data portion of a non-SMTP message *
577*************************************************/
578
579/* This function is called to read the remainder of a message (following the
580header) when the input is not from SMTP - we are receiving a local message on
581a standard input stream. The message is always terminated by EOF, and is also
582terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
583two cases for maximum efficiency.
584
585Ensure that the body ends with a newline. This will naturally be the case when
586the termination is "\n.\n" but may not be otherwise. The RFC defines messages
587as "sequences of lines" - this of course strictly applies only to SMTP, but
588deliveries into BSD-type mailbox files also require it. Exim used to have a
589flag for doing this at delivery time, but as it was always set for all
590transports, I decided to simplify things by putting the check here instead.
591
592There is at least one MUA (dtmail) that sends CRLF via this interface, and
593other programs are known to do this as well. Exim used to have a option for
594dealing with this: in July 2003, after much discussion, the code has been
595changed to default to treat any of LF, CRLF, and bare CR as line terminators.
596
597However, for the case when a dot on a line by itself terminates a message, the
598only recognized terminating sequences before and after the dot are LF and CRLF.
599Otherwise, having read EOL . CR, you don't know whether to read another
600character or not.
601
602Internally, in messages stored in Exim's spool files, LF is used as the line
603terminator. Under the new regime, bare CRs will no longer appear in these
604files.
605
606Arguments:
607 fout a FILE to which to write the message
608
609Returns: One of the END_xxx values indicating why it stopped reading
610*/
611
612static int
613read_message_data(FILE *fout)
614{
615int ch_state;
616register int ch;
d677b2f2 617register int linelength = 0;
059ec3d9
PH
618
619/* Handle the case when only EOF terminates the message */
620
621if (!dot_ends)
622 {
623 register int last_ch = '\n';
624
80a47a2c 625 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
059ec3d9
PH
626 {
627 if (ch == 0) body_zerocount++;
628 if (last_ch == '\r' && ch != '\n')
629 {
d677b2f2
PH
630 if (linelength > max_received_linelength)
631 max_received_linelength = linelength;
632 linelength = 0;
059ec3d9
PH
633 if (fputc('\n', fout) == EOF) return END_WERROR;
634 message_size++;
635 body_linecount++;
636 }
637 if (ch == '\r') continue;
638
639 if (fputc(ch, fout) == EOF) return END_WERROR;
d677b2f2
PH
640 if (ch == '\n')
641 {
642 if (linelength > max_received_linelength)
643 max_received_linelength = linelength;
644 linelength = 0;
645 body_linecount++;
646 }
647 else linelength++;
059ec3d9
PH
648 if (++message_size > thismessage_size_limit) return END_SIZE;
649 }
650
651 if (last_ch != '\n')
652 {
d677b2f2
PH
653 if (linelength > max_received_linelength)
654 max_received_linelength = linelength;
059ec3d9
PH
655 if (fputc('\n', fout) == EOF) return END_WERROR;
656 message_size++;
657 body_linecount++;
658 }
659
660 return END_EOF;
661 }
662
663/* Handle the case when a dot on a line on its own, or EOF, terminates. */
664
665ch_state = 1;
666
80a47a2c 667while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
668 {
669 if (ch == 0) body_zerocount++;
670 switch (ch_state)
671 {
672 case 0: /* Normal state (previous char written) */
673 if (ch == '\n')
d677b2f2
PH
674 {
675 body_linecount++;
676 if (linelength > max_received_linelength)
677 max_received_linelength = linelength;
678 linelength = -1;
679 ch_state = 1;
680 }
059ec3d9
PH
681 else if (ch == '\r')
682 { ch_state = 2; continue; }
683 break;
684
685 case 1: /* After written "\n" */
686 if (ch == '.') { ch_state = 3; continue; }
6eb02f88 687 if (ch == '\r') { ch_state = 2; continue; }
d677b2f2 688 if (ch != '\n') ch_state = 0; else linelength = -1;
059ec3d9
PH
689 break;
690
691 case 2:
692 body_linecount++; /* After unwritten "\r" */
d677b2f2
PH
693 if (linelength > max_received_linelength)
694 max_received_linelength = linelength;
059ec3d9 695 if (ch == '\n')
d677b2f2
PH
696 {
697 ch_state = 1;
698 linelength = -1;
699 }
059ec3d9
PH
700 else
701 {
702 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
703 if (ch == '\r') continue;
704 ch_state = 0;
d677b2f2 705 linelength = 0;
059ec3d9
PH
706 }
707 break;
708
709 case 3: /* After "\n." (\n written, dot not) */
710 if (ch == '\n') return END_DOT;
711 if (ch == '\r') { ch_state = 4; continue; }
712 message_size++;
d677b2f2 713 linelength++;
059ec3d9
PH
714 if (fputc('.', fout) == EOF) return END_WERROR;
715 ch_state = 0;
716 break;
717
718 case 4: /* After "\n.\r" (\n written, rest not) */
719 if (ch == '\n') return END_DOT;
720 message_size += 2;
721 body_linecount++;
722 if (fputs(".\n", fout) == EOF) return END_WERROR;
723 if (ch == '\r') { ch_state = 2; continue; }
724 ch_state = 0;
725 break;
726 }
727
d677b2f2 728 linelength++;
059ec3d9
PH
729 if (fputc(ch, fout) == EOF) return END_WERROR;
730 if (++message_size > thismessage_size_limit) return END_SIZE;
731 }
732
733/* Get here if EOF read. Unless we have just written "\n", we need to ensure
734the message ends with a newline, and we must also write any characters that
735were saved up while testing for an ending dot. */
736
737if (ch_state != 1)
738 {
739 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
740 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
741 message_size += Ustrlen(ends[ch_state]);
742 body_linecount++;
743 }
744
745return END_EOF;
746}
747
748
749
750
751/*************************************************
752* Read data portion of an SMTP message *
753*************************************************/
754
755/* This function is called to read the remainder of an SMTP message (after the
756headers), or to skip over it when an error has occurred. In this case, the
757output file is passed as NULL.
758
759If any line begins with a dot, that character is skipped. The input should only
760be successfully terminated by CR LF . CR LF unless it is local (non-network)
761SMTP, in which case the CRs are optional, but...
762
763FUDGE: It seems that sites on the net send out messages with just LF
764terminators, despite the warnings in the RFCs, and other MTAs handle this. So
765we make the CRs optional in all cases.
766
767July 2003: Bare CRs cause trouble. We now treat them as line terminators as
768well, so that there are no CRs in spooled messages. However, the message
769terminating dot is not recognized between two bare CRs.
770
771Arguments:
772 fout a FILE to which to write the message; NULL if skipping
773
774Returns: One of the END_xxx values indicating why it stopped reading
775*/
776
777static int
778read_message_data_smtp(FILE *fout)
779{
780int ch_state = 0;
e4bdf652 781int ch;
1f5497b2 782register int linelength = 0;
059ec3d9 783
80a47a2c 784while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
785 {
786 if (ch == 0) body_zerocount++;
787 switch (ch_state)
788 {
789 case 0: /* After LF or CRLF */
790 if (ch == '.')
791 {
792 ch_state = 3;
793 continue; /* Don't ever write . after LF */
794 }
795 ch_state = 1;
796
797 /* Else fall through to handle as normal uschar. */
798
799 case 1: /* Normal state */
800 if (ch == '\n')
801 {
802 ch_state = 0;
803 body_linecount++;
1f5497b2
PH
804 if (linelength > max_received_linelength)
805 max_received_linelength = linelength;
806 linelength = -1;
059ec3d9
PH
807 }
808 else if (ch == '\r')
809 {
810 ch_state = 2;
811 continue;
812 }
813 break;
814
815 case 2: /* After (unwritten) CR */
816 body_linecount++;
1f5497b2
PH
817 if (linelength > max_received_linelength)
818 max_received_linelength = linelength;
819 linelength = -1;
059ec3d9
PH
820 if (ch == '\n')
821 {
822 ch_state = 0;
823 }
824 else
825 {
826 message_size++;
827 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 828 (void) cutthrough_put_nl();
059ec3d9
PH
829 if (ch != '\r') ch_state = 1; else continue;
830 }
831 break;
832
833 case 3: /* After [CR] LF . */
834 if (ch == '\n')
835 return END_DOT;
836 if (ch == '\r')
837 {
838 ch_state = 4;
839 continue;
840 }
841 ch_state = 1; /* The dot itself is removed */
842 break;
843
844 case 4: /* After [CR] LF . CR */
845 if (ch == '\n') return END_DOT;
846 message_size++;
847 body_linecount++;
848 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 849 (void) cutthrough_put_nl();
059ec3d9
PH
850 if (ch == '\r')
851 {
852 ch_state = 2;
853 continue;
854 }
855 ch_state = 1;
856 break;
857 }
858
859 /* Add the character to the spool file, unless skipping; then loop for the
860 next. */
861
862 message_size++;
1f5497b2 863 linelength++;
059ec3d9
PH
864 if (fout != NULL)
865 {
866 if (fputc(ch, fout) == EOF) return END_WERROR;
867 if (message_size > thismessage_size_limit) return END_SIZE;
868 }
e4bdf652
JH
869 if(ch == '\n')
870 (void) cutthrough_put_nl();
871 else
872 {
873 uschar c= ch;
874 (void) cutthrough_puts(&c, 1);
875 }
059ec3d9
PH
876 }
877
878/* Fall through here if EOF encountered. This indicates some kind of error,
879since a correct message is terminated by [CR] LF . [CR] LF. */
880
881return END_EOF;
882}
883
884
885
886
887/*************************************************
888* Swallow SMTP message *
889*************************************************/
890
891/* This function is called when there has been some kind of error while reading
892an SMTP message, and the remaining data may need to be swallowed. It is global
893because it is called from smtp_closedown() to shut down an incoming call
894tidily.
895
896Argument: a FILE from which to read the message
897Returns: nothing
898*/
899
900void
901receive_swallow_smtp(void)
902{
903if (message_ended >= END_NOTENDED)
904 message_ended = read_message_data_smtp(NULL);
905}
906
907
908
909/*************************************************
910* Handle lost SMTP connection *
911*************************************************/
912
913/* This function logs connection loss incidents and generates an appropriate
914SMTP response.
915
916Argument: additional data for the message
917Returns: the SMTP response
918*/
919
920static uschar *
921handle_lost_connection(uschar *s)
922{
923log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
924 "%s lost while reading message data%s", smtp_get_connection_info(), s);
925return US"421 Lost incoming connection";
926}
927
928
929
930
931/*************************************************
932* Handle a non-smtp reception error *
933*************************************************/
934
935/* This function is called for various errors during the reception of non-SMTP
936messages. It either sends a message to the sender of the problem message, or it
937writes to the standard error stream.
938
939Arguments:
940 errcode code for moan_to_sender(), identifying the error
941 text1 first message text, passed to moan_to_sender()
942 text2 second message text, used only for stderrr
943 error_rc code to pass to exim_exit if no problem
944 f FILE containing body of message (may be stdin)
945 hptr pointer to instore headers or NULL
946
947Returns: calls exim_exit(), which does not return
948*/
949
950static void
951give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
952 FILE *f, header_line *hptr)
953{
954if (error_handling == ERRORS_SENDER)
955 {
956 error_block eblock;
957 eblock.next = NULL;
958 eblock.text1 = text1;
959 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
960 error_rc = EXIT_FAILURE;
961 }
962else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 963(void)fclose(f);
059ec3d9
PH
964exim_exit(error_rc);
965}
966
967
968
969/*************************************************
970* Add header lines set up by ACL *
971*************************************************/
972
850635b6
PH
973/* This function is called to add the header lines that were set up by
974statements in an ACL to the list of headers in memory. It is done in two stages
975like this, because when the ACL for RCPT is running, the other headers have not
976yet been received. This function is called twice; once just before running the
977DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
978are visible to the DATA ACL.
059ec3d9
PH
979
980Originally these header lines were added at the end. Now there is support for
981three different places: top, bottom, and after the Received: header(s). There
982will always be at least one Received: header, even if it is marked deleted, and
983even if something else has been put in front of it.
984
985Arguments:
986 acl_name text to identify which ACL
987
988Returns: nothing
989*/
990
991static void
578d43dc 992add_acl_headers(int where, uschar *acl_name)
059ec3d9
PH
993{
994header_line *h, *next;
995header_line *last_received = NULL;
e7568d51 996
578d43dc
JH
997switch(where)
998 {
999 case ACL_WHERE_DKIM:
1000 case ACL_WHERE_MIME:
af4a1bca
JH
1001 case ACL_WHERE_DATA:
1002 if (cutthrough_fd >= 0 && (acl_removed_headers || acl_added_headers))
578d43dc
JH
1003 {
1004 log_write(0, LOG_MAIN|LOG_PANIC, "Header modification in data ACLs"
af4a1bca 1005 " will not take effect on cutthrough deliveries");
578d43dc
JH
1006 return;
1007 }
1008 }
1009
e7568d51
TL
1010if (acl_removed_headers != NULL)
1011 {
1012 DEBUG(D_receive|D_acl) debug_printf(">>Headers removed by %s ACL:\n", acl_name);
1013
4a142059 1014 for (h = header_list; h != NULL; h = h->next) if (h->type != htype_old)
e7568d51 1015 {
4a142059 1016 uschar * list = acl_removed_headers;
e7568d51
TL
1017 int sep = ':'; /* This is specified as a colon-separated list */
1018 uschar *s;
1019 uschar buffer[128];
4a142059
JH
1020
1021 while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer))))
1022 if (header_testname(h, s, Ustrlen(s), FALSE))
e7568d51
TL
1023 {
1024 h->type = htype_old;
1025 DEBUG(D_receive|D_acl) debug_printf(" %s", h->text);
1026 }
e7568d51
TL
1027 }
1028 acl_removed_headers = NULL;
1029 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1030 }
059ec3d9 1031
71fafd95 1032if (acl_added_headers == NULL) return;
059ec3d9
PH
1033DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
1034
71fafd95 1035for (h = acl_added_headers; h != NULL; h = next)
059ec3d9
PH
1036 {
1037 next = h->next;
1038
1039 switch(h->type)
1040 {
1041 case htype_add_top:
1042 h->next = header_list;
1043 header_list = h;
1044 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
1045 break;
1046
1047 case htype_add_rec:
1048 if (last_received == NULL)
1049 {
1050 last_received = header_list;
1051 while (!header_testname(last_received, US"Received", 8, FALSE))
1052 last_received = last_received->next;
1053 while (last_received->next != NULL &&
1054 header_testname(last_received->next, US"Received", 8, FALSE))
1055 last_received = last_received->next;
1056 }
1057 h->next = last_received->next;
1058 last_received->next = h;
1059 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
1060 break;
1061
8523533c
TK
1062 case htype_add_rfc:
1063 /* add header before any header which is NOT Received: or Resent- */
1064 last_received = header_list;
1065 while ( (last_received->next != NULL) &&
1066 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
1067 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
1068 last_received = last_received->next;
1069 /* last_received now points to the last Received: or Resent-* header
1070 in an uninterrupted chain of those header types (seen from the beginning
1071 of all headers. Our current header must follow it. */
1072 h->next = last_received->next;
1073 last_received->next = h;
8e669ac1 1074 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
1075 break;
1076
059ec3d9
PH
1077 default:
1078 h->next = NULL;
1079 header_last->next = h;
1080 break;
1081 }
1082
1083 if (h->next == NULL) header_last = h;
1084
1085 /* Check for one of the known header types (From:, To:, etc.) though in
1086 practice most added headers are going to be "other". Lower case
1087 identification letters are never stored with the header; they are used
1088 for existence tests when messages are received. So discard any lower case
1089 flag values. */
1090
1091 h->type = header_checkname(h, FALSE);
1092 if (h->type >= 'a') h->type = htype_other;
1093
1094 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1095 }
1096
71fafd95 1097acl_added_headers = NULL;
059ec3d9
PH
1098DEBUG(D_receive|D_acl) debug_printf(">>\n");
1099}
1100
1101
1102
1103/*************************************************
1104* Add host information for log line *
1105*************************************************/
1106
1107/* Called for acceptance and rejecting log lines. This adds information about
1108the calling host to a string that is being built dynamically.
1109
1110Arguments:
1111 s the dynamic string
1112 sizeptr points to the size variable
1113 ptrptr points to the pointer variable
1114
1115Returns: the extended string
1116*/
1117
1118static uschar *
1119add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr)
1120{
1121if (sender_fullhost != NULL)
1122 {
1123 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
1124 if ((log_extra_selector & LX_incoming_interface) != 0 &&
1125 interface_address != NULL)
1126 {
1127 uschar *ss = string_sprintf(" I=[%s]:%d", interface_address,
1128 interface_port);
1129 s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss));
1130 }
1131 }
1132if (sender_ident != NULL)
1133 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1134if (received_protocol != NULL)
1135 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1136return s;
1137}
1138
1139
1140
63955bf2 1141#ifdef WITH_CONTENT_SCAN
059ec3d9 1142
54cdb463
PH
1143/*************************************************
1144* Run the MIME ACL on a message *
1145*************************************************/
1146
1147/* This code is in a subroutine so that it can be used for both SMTP
1148and non-SMTP messages. It is called with a non-NULL ACL pointer.
1149
1150Arguments:
1151 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1152 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1153 smtp_reply_ptr Where SMTP reply is being built
1154 blackholed_by_ptr Where "blackholed by" message is being built
1155
1156Returns: TRUE to carry on; FALSE to abandon the message
1157*/
1158
1159static BOOL
1160run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1161 uschar **blackholed_by_ptr)
1162{
1163FILE *mbox_file;
1164uschar rfc822_file_path[2048];
1165unsigned long mbox_size;
1166header_line *my_headerlist;
1167uschar *user_msg, *log_msg;
1168int mime_part_count_buffer = -1;
7156b1ef 1169int rc = OK;
54cdb463
PH
1170
1171memset(CS rfc822_file_path,0,2048);
1172
1173/* check if it is a MIME message */
1174my_headerlist = header_list;
4e88a19f
PH
1175while (my_headerlist != NULL)
1176 {
54cdb463 1177 /* skip deleted headers */
4e88a19f
PH
1178 if (my_headerlist->type == '*')
1179 {
54cdb463
PH
1180 my_headerlist = my_headerlist->next;
1181 continue;
4e88a19f
PH
1182 }
1183 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1184 {
54cdb463
PH
1185 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1186 goto DO_MIME_ACL;
4e88a19f 1187 }
54cdb463 1188 my_headerlist = my_headerlist->next;
4e88a19f 1189 }
54cdb463
PH
1190
1191DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1192return TRUE;
1193
1194DO_MIME_ACL:
1195/* make sure the eml mbox file is spooled up */
8544e77a 1196mbox_file = spool_mbox(&mbox_size, NULL);
54cdb463
PH
1197if (mbox_file == NULL) {
1198 /* error while spooling */
1199 log_write(0, LOG_MAIN|LOG_PANIC,
1200 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1201 Uunlink(spool_name);
1202 unspool_mbox();
6f0c431a
PP
1203#ifdef EXPERIMENTAL_DCC
1204 dcc_ok = 0;
1205#endif
a5bd321b 1206 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
54cdb463
PH
1207 message_id[0] = 0; /* Indicate no message accepted */
1208 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1209 return FALSE; /* Indicate skip to end of receive function */
1210};
1211
1212mime_is_rfc822 = 0;
1213
1214MIME_ACL_CHECK:
1215mime_part_count = -1;
1216rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1217(void)fclose(mbox_file);
54cdb463 1218
4e88a19f
PH
1219if (Ustrlen(rfc822_file_path) > 0)
1220 {
54cdb463
PH
1221 mime_part_count = mime_part_count_buffer;
1222
4e88a19f
PH
1223 if (unlink(CS rfc822_file_path) == -1)
1224 {
54cdb463
PH
1225 log_write(0, LOG_PANIC,
1226 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1227 goto END_MIME_ACL;
4e88a19f
PH
1228 }
1229 }
54cdb463
PH
1230
1231/* check if we must check any message/rfc822 attachments */
4e88a19f
PH
1232if (rc == OK)
1233 {
54cdb463 1234 uschar temp_path[1024];
54cdb463
PH
1235 struct dirent *entry;
1236 DIR *tempdir;
1237
b07e6aa3
PH
1238 (void)string_format(temp_path, 1024, "%s/scan/%s", spool_directory,
1239 message_id);
54cdb463 1240
4e88a19f 1241 tempdir = opendir(CS temp_path);
4e88a19f
PH
1242 do
1243 {
1244 entry = readdir(tempdir);
1245 if (entry == NULL) break;
1246 if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0)
1247 {
b07e6aa3 1248 (void)string_format(rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
4e88a19f
PH
1249 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path);
1250 break;
1251 }
1252 } while (1);
1253 closedir(tempdir);
54cdb463 1254
4e88a19f
PH
1255 if (entry != NULL)
1256 {
c58b88df 1257 mbox_file = Ufopen(rfc822_file_path,"rb");
4e88a19f
PH
1258 if (mbox_file == NULL)
1259 {
54cdb463
PH
1260 log_write(0, LOG_PANIC,
1261 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1262 unlink(CS rfc822_file_path);
1263 goto END_MIME_ACL;
4e88a19f 1264 }
54cdb463
PH
1265 /* set RFC822 expansion variable */
1266 mime_is_rfc822 = 1;
1267 mime_part_count_buffer = mime_part_count;
1268 goto MIME_ACL_CHECK;
4e88a19f
PH
1269 }
1270 }
54cdb463
PH
1271
1272END_MIME_ACL:
578d43dc 1273add_acl_headers(ACL_WHERE_MIME, US"MIME");
54cdb463
PH
1274if (rc == DISCARD)
1275 {
1276 recipients_count = 0;
1277 *blackholed_by_ptr = US"MIME ACL";
1278 }
1279else if (rc != OK)
1280 {
1281 Uunlink(spool_name);
1282 unspool_mbox();
6f0c431a
PP
1283#ifdef EXPERIMENTAL_DCC
1284 dcc_ok = 0;
1285#endif
f4c1088b 1286 if (smtp_input && smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0) {
54cdb463 1287 *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */
f4c1088b
PP
1288 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1289 }
54cdb463
PH
1290 message_id[0] = 0; /* Indicate no message accepted */
1291 return FALSE; /* Cause skip to end of receive function */
4e88a19f 1292 }
54cdb463
PH
1293
1294return TRUE;
1295}
1296
63955bf2 1297#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1298
1299
e4bdf652
JH
1300
1301void
1302received_header_gen(void)
1303{
1304uschar *received;
1305uschar *timestamp;
1306header_line *received_header= header_list;
1307
1308timestamp = expand_string(US"${tod_full}");
1309if (recipients_count == 1) received_for = recipients_list[0].address;
1310received = expand_string(received_header_text);
1311received_for = NULL;
1312
1313if (received == NULL)
1314 {
1315 if(spool_name[0] != 0)
1316 Uunlink(spool_name); /* Lose the data file */
1317 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1318 "(received_header_text) failed: %s", string_printing(received_header_text),
1319 expand_string_message);
1320 }
1321
1322/* The first element on the header chain is reserved for the Received header,
1323so all we have to do is fill in the text pointer, and set the type. However, if
1324the result of the expansion is an empty string, we leave the header marked as
1325"old" so as to refrain from adding a Received header. */
1326
1327if (received[0] == 0)
1328 {
1329 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1330 received_header->type = htype_old;
1331 }
1332else
1333 {
1334 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1335 received_header->type = htype_received;
1336 }
1337
1338received_header->slen = Ustrlen(received_header->text);
1339
1340DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1341 received_header->type, received_header->text);
1342}
1343
1344
1345
059ec3d9
PH
1346/*************************************************
1347* Receive message *
1348*************************************************/
1349
1350/* Receive a message on the given input, and put it into a pair of spool files.
1351Either a non-null list of recipients, or the extract flag will be true, or
1352both. The flag sender_local is true for locally generated messages. The flag
1353submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a 1354suppress_local_fixups is true if an ACL has obeyed "control =
f4ee74ac
PP
1355suppress_local_fixups" or -G was passed on the command-line.
1356The flag smtp_input is true if the message is to be
8800895a
PH
1357handled using SMTP conventions about termination and lines starting with dots.
1358For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1359
1360If a message was successfully read, message_id[0] will be non-zero.
1361
1362The general actions of this function are:
1363
1364 . Read the headers of the message (if any) into a chain of store
1365 blocks.
1366
1367 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1368 throw it away, unless the caller is trusted, or unless
1369 active_local_sender_retain is set - which can only happen if
1370 active_local_from_check is false.
059ec3d9
PH
1371
1372 . If recipients are to be extracted from the message, build the
1373 recipients list from the headers, removing any that were on the
1374 original recipients list (unless extract_addresses_remove_arguments is
1375 false), and at the same time, remove any bcc header that may be present.
1376
1377 . Get the spool file for the data, sort out its unique name, open
1378 and lock it (but don't give it the name yet).
1379
1380 . Generate a "Message-Id" header if the message doesn't have one, for
1381 locally-originated messages.
1382
1383 . Generate a "Received" header.
1384
1385 . Ensure the recipients list is fully qualified and rewritten if necessary.
1386
1387 . If there are any rewriting rules, apply them to the sender address
1388 and also to the headers.
1389
1390 . If there is no from: header, generate one, for locally-generated messages
1391 and messages in "submission mode" only.
1392
1393 . If the sender is local, check that from: is correct, and if not, generate
1394 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1395 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1396
1397 . If there is no "date" header, generate one, for locally-originated
1398 or submission mode messages only.
1399
1400 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1401 dot_ends mode, to the data file. Leave it open, to hold the lock.
1402
1403 . Write the envelope and the headers to a new file.
1404
1405 . Set the name for the header file; close it.
1406
1407 . Set the name for the data file; close it.
1408
1409Because this function can potentially be called many times in a single
1410SMTP connection, all store should be got by store_get(), so that it will be
1411automatically retrieved after the message is accepted.
1412
1413FUDGE: It seems that sites on the net send out messages with just LF
1414terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1415we make the CRs optional in all cases.
1416
1417July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1418new regime is now in place in which bare CRs in header lines are turned into LF
1419followed by a space, so as not to terminate the header line.
1420
1421February 2004: A bare LF in a header line in a message whose first line was
1422terminated by CRLF is treated in the same way as a bare CR.
1423
1424Arguments:
1425 extract_recip TRUE if recipients are to be extracted from the message's
1426 headers
1427
1428Returns: TRUE there are more messages to be read (SMTP input)
1429 FALSE there are no more messages to be read (non-SMTP input
1430 or SMTP connection collapsed, or other failure)
1431
1432When reading a message for filter testing, the returned value indicates
1433whether the headers (which is all that is read) were terminated by '.' or
1434not. */
1435
1436BOOL
1437receive_msg(BOOL extract_recip)
1438{
7156b1ef
NM
1439int i;
1440int rc = FAIL;
059ec3d9
PH
1441int msg_size = 0;
1442int process_info_len = Ustrlen(process_info);
1443int error_rc = (error_handling == ERRORS_SENDER)?
1444 errors_sender_rc : EXIT_FAILURE;
1445int header_size = 256;
1446int start, end, domain, size, sptr;
1447int id_resolution;
1448int had_zero = 0;
d677b2f2 1449int prevlines_length = 0;
059ec3d9
PH
1450
1451register int ptr = 0;
1452
1453BOOL contains_resent_headers = FALSE;
1454BOOL extracted_ignored = FALSE;
1455BOOL first_line_ended_crlf = TRUE_UNSET;
1456BOOL smtp_yield = TRUE;
1457BOOL yield = FALSE;
1458
1459BOOL resents_exist = FALSE;
1460uschar *resent_prefix = US"";
1461uschar *blackholed_by = NULL;
04f7d5b9 1462uschar *blackhole_log_msg = US"";
c5430c20 1463enum {NOT_TRIED, TMP_REJ, PERM_REJ, ACCEPTED} cutthrough_done = NOT_TRIED;
059ec3d9
PH
1464
1465flock_t lock_data;
1466error_block *bad_addresses = NULL;
1467
1468uschar *frozen_by = NULL;
1469uschar *queued_by = NULL;
1470
1471uschar *errmsg, *s;
1472struct stat statbuf;
1473
4e88a19f 1474/* Final message to give to SMTP caller, and messages from ACLs */
059ec3d9
PH
1475
1476uschar *smtp_reply = NULL;
4e88a19f 1477uschar *user_msg, *log_msg;
059ec3d9
PH
1478
1479/* Working header pointers */
1480
1481header_line *h, *next;
1482
2cbb4081 1483/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1484
1485BOOL date_header_exists = FALSE;
1486
1487/* Pointers to receive the addresses of headers whose contents we need. */
1488
1489header_line *from_header = NULL;
1490header_line *subject_header = NULL;
1491header_line *msgid_header = NULL;
1492header_line *received_header;
1493
4840604e
TL
1494#ifdef EXPERIMENTAL_DMARC
1495int dmarc_up = 0;
1496#endif /* EXPERIMENTAL_DMARC */
1497
059ec3d9
PH
1498/* Variables for use when building the Received: header. */
1499
059ec3d9
PH
1500uschar *timestamp;
1501int tslen;
1502
1503/* Release any open files that might have been cached while preparing to
1504accept the message - e.g. by verifying addresses - because reading a message
1505might take a fair bit of real time. */
1506
1507search_tidyup();
1508
e4bdf652
JH
1509/* Extracting the recipient list from an input file is incompatible with
1510cutthrough delivery with the no-spool option. It shouldn't be possible
817d9f57 1511to set up the combination, but just in case kill any ongoing connection. */
e4bdf652 1512if (extract_recip || !smtp_input)
2e5b33cd 1513 cancel_cutthrough_connection("not smtp input");
e4bdf652 1514
059ec3d9
PH
1515/* Initialize the chain of headers by setting up a place-holder for Received:
1516header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1517pointing to the end of the chain to make adding headers simple. */
1518
1519received_header = header_list = header_last = store_get(sizeof(header_line));
1520header_list->next = NULL;
1521header_list->type = htype_old;
1522header_list->text = NULL;
1523header_list->slen = 0;
1524
1525/* Control block for the next header to be read. */
1526
1527next = store_get(sizeof(header_line));
1528next->text = store_get(header_size);
1529
1530/* Initialize message id to be null (indicating no message read), and the
1531header names list to be the normal list. Indicate there is no data file open
1532yet, initialize the size and warning count, and deal with no size limit. */
1533
1534message_id[0] = 0;
1535data_file = NULL;
1536data_fd = -1;
1537spool_name[0] = 0;
1538message_size = 0;
1539warning_count = 0;
d677b2f2 1540received_count = 1; /* For the one we will add */
059ec3d9
PH
1541
1542if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1543
2e0c1448 1544/* While reading the message, the following counts are computed. */
059ec3d9 1545
d677b2f2
PH
1546message_linecount = body_linecount = body_zerocount =
1547 max_received_linelength = 0;
059ec3d9 1548
80a47a2c
TK
1549#ifndef DISABLE_DKIM
1550/* Call into DKIM to set up the context. */
1551if (smtp_input && !smtp_batched_input && !dkim_disable_verify) dkim_exim_verify_init();
fb2274d4
TK
1552#endif
1553
4840604e
TL
1554#ifdef EXPERIMENTAL_DMARC
1555/* initialize libopendmarc */
1556dmarc_up = dmarc_init();
1557#endif
1558
059ec3d9
PH
1559/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1560ids, and fractions of a second are required. See the comments that precede the
1561message id creation below. */
1562
1563(void)gettimeofday(&message_id_tv, NULL);
1564
1565/* For other uses of the received time we can operate with granularity of one
1566second, and for that we use the global variable received_time. This is for
1567things like ultimate message timeouts. */
1568
1569received_time = message_id_tv.tv_sec;
1570
1571/* If SMTP input, set the special handler for timeouts. The alarm() calls
1572happen in the smtp_getc() function when it refills its buffer. */
1573
1574if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1575
1576/* If not SMTP input, timeout happens only if configured, and we just set a
1577single timeout for the whole message. */
1578
1579else if (receive_timeout > 0)
1580 {
1581 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1582 alarm(receive_timeout);
1583 }
1584
1585/* SIGTERM and SIGINT are caught always. */
1586
1587signal(SIGTERM, data_sigterm_sigint_handler);
1588signal(SIGINT, data_sigterm_sigint_handler);
1589
1590/* Header lines in messages are not supposed to be very long, though when
1591unfolded, to: and cc: headers can take up a lot of store. We must also cope
1592with the possibility of junk being thrown at us. Start by getting 256 bytes for
1593storing the header, and extend this as necessary using string_cat().
1594
1595To cope with total lunacies, impose an upper limit on the length of the header
1596section of the message, as otherwise the store will fill up. We must also cope
1597with the possibility of binary zeros in the data. Hence we cannot use fgets().
1598Folded header lines are joined into one string, leaving the '\n' characters
1599inside them, so that writing them out reproduces the input.
1600
1601Loop for each character of each header; the next structure for chaining the
1602header is set up already, with ptr the offset of the next character in
1603next->text. */
1604
1605for (;;)
1606 {
80a47a2c 1607 int ch = (receive_getc)();
059ec3d9
PH
1608
1609 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1610 SMTP must have a correct "." terminator. */
1611
1612 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1613 {
1614 smtp_reply = handle_lost_connection(US" (header)");
1615 smtp_yield = FALSE;
1616 goto TIDYUP; /* Skip to end of function */
1617 }
1618
1619 /* See if we are at the current header's size limit - there must be at least
1620 four bytes left. This allows for the new character plus a zero, plus two for
1621 extra insertions when we are playing games with dots and carriage returns. If
1622 we are at the limit, extend the text buffer. This could have been done
1623 automatically using string_cat() but because this is a tightish loop storing
1624 only one character at a time, we choose to do it inline. Normally
1625 store_extend() will be able to extend the block; only at the end of a big
1626 store block will a copy be needed. To handle the case of very long headers
1627 (and sometimes lunatic messages can have ones that are 100s of K long) we
1628 call store_release() for strings that have been copied - if the string is at
1629 the start of a block (and therefore the only thing in it, because we aren't
1630 doing any other gets), the block gets freed. We can only do this because we
1631 know there are no other calls to store_get() going on. */
1632
1633 if (ptr >= header_size - 4)
1634 {
1635 int oldsize = header_size;
1636 /* header_size += 256; */
1637 header_size *= 2;
1638 if (!store_extend(next->text, oldsize, header_size))
1639 {
1640 uschar *newtext = store_get(header_size);
1641 memcpy(newtext, next->text, ptr);
1642 store_release(next->text);
1643 next->text = newtext;
1644 }
1645 }
1646
1647 /* Cope with receiving a binary zero. There is dispute about whether
1648 these should be allowed in RFC 822 messages. The middle view is that they
1649 should not be allowed in headers, at least. Exim takes this attitude at
1650 the moment. We can't just stomp on them here, because we don't know that
1651 this line is a header yet. Set a flag to cause scanning later. */
1652
1653 if (ch == 0) had_zero++;
1654
1655 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1656 those from data files use just LF. Treat LF in local SMTP input as a
1657 terminator too. Treat EOF as a line terminator always. */
1658
1659 if (ch == EOF) goto EOL;
1660
1661 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1662 other MTAs accept this. We are therefore forced into this "liberalisation"
1663 too, so we accept LF as a line terminator whatever the source of the message.
1664 However, if the first line of the message ended with a CRLF, we treat a bare
1665 LF specially by inserting a white space after it to ensure that the header
1666 line is not terminated. */
1667
1668 if (ch == '\n')
1669 {
1670 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
80a47a2c 1671 else if (first_line_ended_crlf) receive_ungetc(' ');
059ec3d9
PH
1672 goto EOL;
1673 }
1674
1675 /* This is not the end of the line. If this is SMTP input and this is
1676 the first character in the line and it is a "." character, ignore it.
1677 This implements the dot-doubling rule, though header lines starting with
1678 dots aren't exactly common. They are legal in RFC 822, though. If the
1679 following is CRLF or LF, this is the line that that terminates the
1680 entire message. We set message_ended to indicate this has happened (to
1681 prevent further reading), and break out of the loop, having freed the
1682 empty header, and set next = NULL to indicate no data line. */
1683
1684 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1685 {
80a47a2c 1686 ch = (receive_getc)();
059ec3d9
PH
1687 if (ch == '\r')
1688 {
80a47a2c 1689 ch = (receive_getc)();
059ec3d9
PH
1690 if (ch != '\n')
1691 {
80a47a2c 1692 receive_ungetc(ch);
059ec3d9
PH
1693 ch = '\r'; /* Revert to CR */
1694 }
1695 }
1696 if (ch == '\n')
1697 {
1698 message_ended = END_DOT;
1699 store_reset(next);
1700 next = NULL;
1701 break; /* End character-reading loop */
1702 }
1703
1704 /* For non-SMTP input, the dot at the start of the line was really a data
1705 character. What is now in ch is the following character. We guaranteed
1706 enough space for this above. */
1707
1708 if (!smtp_input)
1709 {
1710 next->text[ptr++] = '.';
1711 message_size++;
1712 }
1713 }
1714
1715 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1716 remember this case if this is the first line ending. */
1717
1718 if (ch == '\r')
1719 {
80a47a2c 1720 ch = (receive_getc)();
059ec3d9
PH
1721 if (ch == '\n')
1722 {
1723 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1724 goto EOL;
1725 }
1726
1727 /* Otherwise, put back the character after CR, and turn the bare CR
1728 into LF SP. */
1729
80a47a2c 1730 ch = (receive_ungetc)(ch);
059ec3d9
PH
1731 next->text[ptr++] = '\n';
1732 message_size++;
1733 ch = ' ';
1734 }
1735
1736 /* We have a data character for the header line. */
1737
1738 next->text[ptr++] = ch; /* Add to buffer */
1739 message_size++; /* Total message size so far */
1740
1741 /* Handle failure due to a humungously long header section. The >= allows
1742 for the terminating \n. Add what we have so far onto the headers list so
1743 that it gets reflected in any error message, and back up the just-read
1744 character. */
1745
1746 if (message_size >= header_maxsize)
1747 {
1748 next->text[ptr] = 0;
1749 next->slen = ptr;
1750 next->type = htype_other;
1751 next->next = NULL;
1752 header_last->next = next;
1753 header_last = next;
1754
1755 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1756 "%s (more than %d characters): message abandoned",
1757 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1758
1759 if (smtp_input)
1760 {
1761 smtp_reply = US"552 Message header is ridiculously long";
1762 receive_swallow_smtp();
1763 goto TIDYUP; /* Skip to end of function */
1764 }
1765
1766 else
1767 {
1768 give_local_error(ERRMESS_VLONGHEADER,
1769 string_sprintf("message header longer than %d characters received: "
1770 "message not accepted", header_maxsize), US"", error_rc, stdin,
1771 header_list->next);
1772 /* Does not return */
1773 }
1774 }
1775
1776 continue; /* With next input character */
1777
1778 /* End of header line reached */
1779
1780 EOL:
2e0c1448
PH
1781
1782 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1783
1784 receive_linecount++;
1785 message_linecount++;
059ec3d9 1786
d677b2f2
PH
1787 /* Keep track of maximum line length */
1788
1789 if (ptr - prevlines_length > max_received_linelength)
1790 max_received_linelength = ptr - prevlines_length;
1791 prevlines_length = ptr + 1;
1792
059ec3d9
PH
1793 /* Now put in the terminating newline. There is always space for
1794 at least two more characters. */
1795
1796 next->text[ptr++] = '\n';
1797 message_size++;
1798
1799 /* A blank line signals the end of the headers; release the unwanted
1800 space and set next to NULL to indicate this. */
1801
1802 if (ptr == 1)
1803 {
1804 store_reset(next);
1805 next = NULL;
1806 break;
1807 }
1808
1809 /* There is data in the line; see if the next input character is a
1810 whitespace character. If it is, we have a continuation of this header line.
1811 There is always space for at least one character at this point. */
1812
1813 if (ch != EOF)
1814 {
80a47a2c 1815 int nextch = (receive_getc)();
059ec3d9
PH
1816 if (nextch == ' ' || nextch == '\t')
1817 {
1818 next->text[ptr++] = nextch;
1819 message_size++;
1820 continue; /* Iterate the loop */
1821 }
80a47a2c 1822 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
059ec3d9
PH
1823 else ch = EOF; /* Cause main loop to exit at end */
1824 }
1825
1826 /* We have got to the real line end. Terminate the string and release store
1827 beyond it. If it turns out to be a real header, internal binary zeros will
1828 be squashed later. */
1829
1830 next->text[ptr] = 0;
1831 next->slen = ptr;
1832 store_reset(next->text + ptr + 1);
1833
1834 /* Check the running total size against the overall message size limit. We
1835 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1836 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1837 headers - the code to read the body will then also hit the buffer. */
1838
1839 if (message_size > thismessage_size_limit) break;
1840
1841 /* A line that is not syntactically correct for a header also marks
1842 the end of the headers. In this case, we leave next containing the
1843 first data line. This might actually be several lines because of the
1844 continuation logic applied above, but that doesn't matter.
1845
1846 It turns out that smail, and presumably sendmail, accept leading lines
1847 of the form
1848
1849 From ph10 Fri Jan 5 12:35 GMT 1996
1850
1851 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1852 find any documentation of this, but for compatibility it had better be
1853 accepted. Exim restricts it to the case of non-smtp messages, and
1854 treats it as an alternative to the -f command line option. Thus it is
1855 ignored except for trusted users or filter testing. Otherwise it is taken
1856 as the sender address, unless -f was used (sendmail compatibility).
1857
1858 It further turns out that some UUCPs generate the From_line in a different
1859 format, e.g.
1860
1861 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1862
1863 The regex for matching these things is now capable of recognizing both
1864 formats (including 2- and 4-digit years in the latter). In fact, the regex
1865 is now configurable, as is the expansion string to fish out the sender.
1866
1867 Even further on it has been discovered that some broken clients send
1868 these lines in SMTP messages. There is now an option to ignore them from
1869 specified hosts or networks. Sigh. */
1870
1871 if (header_last == header_list &&
1872 (!smtp_input
1873 ||
1874 (sender_host_address != NULL &&
1875 verify_check_host(&ignore_fromline_hosts) == OK)
1876 ||
1877 (sender_host_address == NULL && ignore_fromline_local)
1878 ) &&
1879 regex_match_and_setup(regex_From, next->text, 0, -1))
1880 {
1881 if (!sender_address_forced)
1882 {
1883 uschar *uucp_sender = expand_string(uucp_from_sender);
1884 if (uucp_sender == NULL)
1885 {
1886 log_write(0, LOG_MAIN|LOG_PANIC,
1887 "expansion of \"%s\" failed after matching "
1888 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1889 }
1890 else
1891 {
1892 int start, end, domain;
1893 uschar *errmess;
1894 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1895 &start, &end, &domain, TRUE);
1896 if (newsender != NULL)
1897 {
1898 if (domain == 0 && newsender[0] != 0)
1899 newsender = rewrite_address_qualify(newsender, FALSE);
1900
f05da2e8 1901 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1902 {
1903 sender_address = newsender;
1904
f05da2e8 1905 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1906 {
1907 authenticated_sender = NULL;
1908 originator_name = US"";
1909 sender_local = FALSE;
1910 }
1911
f05da2e8 1912 if (filter_test != FTEST_NONE)
059ec3d9
PH
1913 printf("Sender taken from \"From \" line\n");
1914 }
1915 }
1916 }
1917 }
1918 }
1919
1920 /* Not a leading "From " line. Check to see if it is a valid header line.
1921 Header names may contain any non-control characters except space and colon,
1922 amazingly. */
1923
1924 else
1925 {
1926 uschar *p = next->text;
1927
1928 /* If not a valid header line, break from the header reading loop, leaving
1929 next != NULL, indicating that it holds the first line of the body. */
1930
1931 if (isspace(*p)) break;
1932 while (mac_isgraph(*p) && *p != ':') p++;
1933 while (isspace(*p)) p++;
1934 if (*p != ':')
1935 {
1936 body_zerocount = had_zero;
1937 break;
1938 }
1939
1940 /* We have a valid header line. If there were any binary zeroes in
1941 the line, stomp on them here. */
1942
1943 if (had_zero > 0)
1944 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
1945
1946 /* It is perfectly legal to have an empty continuation line
1947 at the end of a header, but it is confusing to humans
1948 looking at such messages, since it looks like a blank line.
1949 Reduce confusion by removing redundant white space at the
1950 end. We know that there is at least one printing character
1951 (the ':' tested for above) so there is no danger of running
1952 off the end. */
1953
1954 p = next->text + ptr - 2;
1955 for (;;)
1956 {
1957 while (*p == ' ' || *p == '\t') p--;
1958 if (*p != '\n') break;
1959 ptr = (p--) - next->text + 1;
1960 message_size -= next->slen - ptr;
1961 next->text[ptr] = 0;
1962 next->slen = ptr;
1963 }
1964
1965 /* Add the header to the chain */
1966
1967 next->type = htype_other;
1968 next->next = NULL;
1969 header_last->next = next;
1970 header_last = next;
1971
1972 /* Check the limit for individual line lengths. This comes after adding to
1973 the chain so that the failing line is reflected if a bounce is generated
1974 (for a local message). */
1975
1976 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
1977 {
1978 log_write(0, LOG_MAIN, "overlong message header line received from "
1979 "%s (more than %d characters): message abandoned",
1980 sender_host_unknown? sender_ident : sender_fullhost,
1981 header_line_maxsize);
1982
1983 if (smtp_input)
1984 {
1985 smtp_reply = US"552 A message header line is too long";
1986 receive_swallow_smtp();
1987 goto TIDYUP; /* Skip to end of function */
1988 }
1989
1990 else
1991 {
1992 give_local_error(ERRMESS_VLONGHDRLINE,
1993 string_sprintf("message header line longer than %d characters "
1994 "received: message not accepted", header_line_maxsize), US"",
1995 error_rc, stdin, header_list->next);
1996 /* Does not return */
1997 }
1998 }
1999
2000 /* Note if any resent- fields exist. */
2001
2002 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
2003 {
2004 resents_exist = TRUE;
2005 resent_prefix = US"Resent-";
2006 }
2007 }
2008
2009 /* The line has been handled. If we have hit EOF, break out of the loop,
2010 indicating no pending data line. */
2011
2012 if (ch == EOF) { next = NULL; break; }
2013
2014 /* Set up for the next header */
2015
2016 header_size = 256;
2017 next = store_get(sizeof(header_line));
2018 next->text = store_get(header_size);
2019 ptr = 0;
2020 had_zero = 0;
d677b2f2 2021 prevlines_length = 0;
059ec3d9
PH
2022 } /* Continue, starting to read the next header */
2023
2024/* At this point, we have read all the headers into a data structure in main
2025store. The first header is still the dummy placeholder for the Received: header
2026we are going to generate a bit later on. If next != NULL, it contains the first
2027data line - which terminated the headers before reaching a blank line (not the
2028normal case). */
2029
2030DEBUG(D_receive)
2031 {
2032 debug_printf(">>Headers received:\n");
2033 for (h = header_list->next; h != NULL; h = h->next)
2034 debug_printf("%s", h->text);
2035 debug_printf("\n");
2036 }
2037
2038/* End of file on any SMTP connection is an error. If an incoming SMTP call
2039is dropped immediately after valid headers, the next thing we will see is EOF.
2040We must test for this specially, as further down the reading of the data is
2041skipped if already at EOF. */
2042
2043if (smtp_input && (receive_feof)())
2044 {
2045 smtp_reply = handle_lost_connection(US" (after header)");
2046 smtp_yield = FALSE;
2047 goto TIDYUP; /* Skip to end of function */
2048 }
2049
2050/* If this is a filter test run and no headers were read, output a warning
2051in case there is a mistake in the test message. */
2052
f05da2e8 2053if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
2054 printf("Warning: no message headers read\n");
2055
2056
2057/* Scan the headers to identify them. Some are merely marked for later
2058processing; some are dealt with here. */
2059
2060for (h = header_list->next; h != NULL; h = h->next)
2061 {
2062 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
2063 if (is_resent) contains_resent_headers = TRUE;
2064
2065 switch (header_checkname(h, is_resent))
2066 {
059ec3d9 2067 case htype_bcc:
2cbb4081 2068 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
2069 break;
2070
059ec3d9 2071 case htype_cc:
2cbb4081 2072 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
2073 break;
2074
2075 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
2076
2077 case htype_date:
4c69d561 2078 if (!resents_exist || is_resent) date_header_exists = TRUE;
059ec3d9
PH
2079 break;
2080
2081 /* Same comments as about Return-Path: below. */
2082
2083 case htype_delivery_date:
2084 if (delivery_date_remove) h->type = htype_old;
2085 break;
2086
2087 /* Same comments as about Return-Path: below. */
2088
2089 case htype_envelope_to:
2090 if (envelope_to_remove) h->type = htype_old;
2091 break;
2092
2093 /* Mark all "From:" headers so they get rewritten. Save the one that is to
2094 be used for Sender: checking. For Sendmail compatibility, if the "From:"
2095 header consists of just the login id of the user who called Exim, rewrite
2096 it with the gecos field first. Apply this rule to Resent-From: if there
2097 are resent- fields. */
2098
2099 case htype_from:
2100 h->type = htype_from;
2101 if (!resents_exist || is_resent)
2102 {
2103 from_header = h;
2104 if (!smtp_input)
2105 {
5de8faa3 2106 int len;
059ec3d9
PH
2107 uschar *s = Ustrchr(h->text, ':') + 1;
2108 while (isspace(*s)) s++;
5de8faa3 2109 len = h->slen - (s - h->text) - 1;
e0fccd1d
TF
2110 if (Ustrlen(originator_login) == len &&
2111 strncmpic(s, originator_login, len) == 0)
059ec3d9
PH
2112 {
2113 uschar *name = is_resent? US"Resent-From" : US"From";
2114 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2115 originator_login, qualify_domain_sender);
2116 from_header = header_last;
2117 h->type = htype_old;
2118 DEBUG(D_receive|D_rewrite)
2119 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2120 }
2121 }
2122 }
2123 break;
2124
2125 /* Identify the Message-id: header for generating "in-reply-to" in the
2126 autoreply transport. For incoming logging, save any resent- value. In both
2127 cases, take just the first of any multiples. */
2128
2129 case htype_id:
2130 if (msgid_header == NULL && (!resents_exist || is_resent))
2131 {
2132 msgid_header = h;
2133 h->type = htype_id;
2134 }
2135 break;
2136
2137 /* Flag all Received: headers */
2138
2139 case htype_received:
2140 h->type = htype_received;
2141 received_count++;
2142 break;
2143
2144 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2145
2146 case htype_reply_to:
2147 h->type = htype_reply_to;
2148 break;
2149
2150 /* The Return-path: header is supposed to be added to messages when
2151 they leave the SMTP system. We shouldn't receive messages that already
2152 contain Return-path. However, since Exim generates Return-path: on
2153 local delivery, resent messages may well contain it. We therefore
2154 provide an option (which defaults on) to remove any Return-path: headers
2155 on input. Removal actually means flagging as "old", which prevents the
2156 header being transmitted with the message. */
2157
2158 case htype_return_path:
2159 if (return_path_remove) h->type = htype_old;
2160
2161 /* If we are testing a mail filter file, use the value of the
2162 Return-Path: header to set up the return_path variable, which is not
2163 otherwise set. However, remove any <> that surround the address
2164 because the variable doesn't have these. */
2165
f05da2e8 2166 if (filter_test != FTEST_NONE)
059ec3d9
PH
2167 {
2168 uschar *start = h->text + 12;
2169 uschar *end = start + Ustrlen(start);
2170 while (isspace(*start)) start++;
2171 while (end > start && isspace(end[-1])) end--;
2172 if (*start == '<' && end[-1] == '>')
2173 {
2174 start++;
2175 end--;
2176 }
2177 return_path = string_copyn(start, end - start);
2178 printf("Return-path taken from \"Return-path:\" header line\n");
2179 }
2180 break;
2181
2182 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
2183 and from an untrusted caller and suppress_local_fixups is not set, or if we
2184 are in submission mode for a remote message, mark it "old" so that it will
2185 not be transmitted with the message, unless active_local_sender_retain is
2186 set. (This can only be true if active_local_from_check is false.) If there
2187 are any resent- headers in the message, apply this rule to Resent-Sender:
2188 instead of Sender:. Messages with multiple resent- header sets cannot be
2189 tidily handled. (For this reason, at least one MUA - Pine - turns old
2190 resent- headers into X-resent- headers when resending, leaving just one
2191 set.) */
059ec3d9
PH
2192
2193 case htype_sender:
69358f02 2194 h->type = ((!active_local_sender_retain &&
8800895a
PH
2195 (
2196 (sender_local && !trusted_caller && !suppress_local_fixups)
2197 || submission_mode
2198 )
059ec3d9
PH
2199 ) &&
2200 (!resents_exist||is_resent))?
2201 htype_old : htype_sender;
2202 break;
2203
2204 /* Remember the Subject: header for logging. There is no Resent-Subject */
2205
2206 case htype_subject:
2207 subject_header = h;
2208 break;
2209
2210 /* "To:" gets flagged, and the existence of a recipient header is noted,
2211 whether it's resent- or not. */
2212
2213 case htype_to:
2214 h->type = htype_to;
2215 /****
2216 to_or_cc_header_exists = TRUE;
2217 ****/
2218 break;
2219 }
2220 }
2221
2222/* Extract recipients from the headers if that is required (the -t option).
2223Note that this is documented as being done *before* any address rewriting takes
2224place. There are two possibilities:
2225
2226(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2227recipients already listed are to be REMOVED from the message. Smail 3 works
2228like this. We need to build a non-recipients tree for that list, because in
2229subsequent processing this data is held in a tree and that's what the
2230spool_write_header() function expects. Make sure that non-recipient addresses
2231are fully qualified and rewritten if necessary.
2232
2233(2) According to other sendmail documentation, -t ADDS extracted recipients to
2234those in the command line arguments (and it is rumoured some other MTAs do
2235this). Therefore, there is an option to make Exim behave this way.
2236
2237*** Notes on "Resent-" header lines ***
2238
2239The presence of resent-headers in the message makes -t horribly ambiguous.
2240Experiments with sendmail showed that it uses recipients for all resent-
2241headers, totally ignoring the concept of "sets of resent- headers" as described
2242in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2243with all the addresses in one instance of each header.
2244
2245This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2246error for -t if there were resent- headers in the message. However, after a
2247discussion on the mailing list, I've learned that there are MUAs that use
2248resent- headers with -t, and also that the stuff about sets of resent- headers
2249and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2250message with -t and resent- header lines makes sure that only *its* resent-
2251headers are present; previous ones are often renamed as X-resent- for example.
2252
2253Consequently, Exim has been changed so that, if any resent- header lines are
2254present, the recipients are taken from all of the appropriate resent- lines,
2255and not from the ordinary To:, Cc:, etc. */
2256
2257if (extract_recip)
2258 {
2259 int rcount = 0;
2260 error_block **bnext = &bad_addresses;
2261
2262 if (extract_addresses_remove_arguments)
2263 {
2264 while (recipients_count-- > 0)
2265 {
2266 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2267 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2268 tree_add_nonrecipient(s);
2269 }
2270 recipients_list = NULL;
2271 recipients_count = recipients_list_max = 0;
2272 }
2273
059ec3d9
PH
2274 /* Now scan the headers */
2275
2276 for (h = header_list->next; h != NULL; h = h->next)
2277 {
2278 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2279 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2280 {
2281 uschar *s = Ustrchr(h->text, ':') + 1;
2282 while (isspace(*s)) s++;
2283
1eccaa59
PH
2284 parse_allow_group = TRUE; /* Allow address group syntax */
2285
059ec3d9
PH
2286 while (*s != 0)
2287 {
2288 uschar *ss = parse_find_address_end(s, FALSE);
2289 uschar *recipient, *errmess, *p, *pp;
2290 int start, end, domain;
2291
2292 /* Check on maximum */
2293
2294 if (recipients_max > 0 && ++rcount > recipients_max)
2295 {
2296 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2297 US"message rejected: ", error_rc, stdin, NULL);
2298 /* Does not return */
2299 }
2300
2301 /* Make a copy of the address, and remove any internal newlines. These
2302 may be present as a result of continuations of the header line. The
2303 white space that follows the newline must not be removed - it is part
2304 of the header. */
2305
2306 pp = recipient = store_get(ss - s + 1);
2307 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2308 *pp = 0;
2309 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2310 &domain, FALSE);
2311
2312 /* Keep a list of all the bad addresses so we can send a single
2313 error message at the end. However, an empty address is not an error;
2314 just ignore it. This can come from an empty group list like
2315
2316 To: Recipients of list:;
2317
2318 If there are no recipients at all, an error will occur later. */
2319
2320 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2321 {
2322 int len = Ustrlen(s);
2323 error_block *b = store_get(sizeof(error_block));
2324 while (len > 0 && isspace(s[len-1])) len--;
2325 b->next = NULL;
2326 b->text1 = string_printing(string_copyn(s, len));
2327 b->text2 = errmess;
2328 *bnext = b;
2329 bnext = &(b->next);
2330 }
2331
2332 /* If the recipient is already in the nonrecipients tree, it must
2333 have appeared on the command line with the option extract_addresses_
2334 remove_arguments set. Do not add it to the recipients, and keep a note
2335 that this has happened, in order to give a better error if there are
2336 no recipients left. */
2337
2338 else if (recipient != NULL)
2339 {
2340 if (tree_search(tree_nonrecipients, recipient) == NULL)
2341 receive_add_recipient(recipient, -1);
2342 else
2343 extracted_ignored = TRUE;
2344 }
2345
2346 /* Move on past this address */
2347
2348 s = ss + (*ss? 1:0);
2349 while (isspace(*s)) s++;
1eccaa59
PH
2350 } /* Next address */
2351
2352 parse_allow_group = FALSE; /* Reset group syntax flags */
2353 parse_found_group = FALSE;
059ec3d9
PH
2354
2355 /* If this was the bcc: header, mark it "old", which means it
2356 will be kept on the spool, but not transmitted as part of the
2357 message. */
2358
2cbb4081 2359 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2360 } /* For appropriate header line */
2361 } /* For each header line */
2362
059ec3d9
PH
2363 }
2364
2365/* Now build the unique message id. This has changed several times over the
2366lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2367Retaining all the history in the comment has become too unwieldy - read
2368previous release sources if you want it.
2369
2370The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2371The first part is the current time, in seconds. The second part is the current
2372pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2373can hold a number in the range 0-3843. It used to be a computed sequence
2374number, but is now the fractional component of the current time in units of
23751/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2376received, Exim ensures that the timer has ticked at the appropriate level
2377before proceeding, to avoid duplication if the pid happened to be re-used
2378within the same time period. It seems likely that most messages will take at
2379least half a millisecond to be received, so no delay will normally be
2380necessary. At least for some time...
2381
2382There is a modification when localhost_number is set. Formerly this was allowed
2383to be as large as 255. Now it is restricted to the range 0-16, and the final
2384component of the message id becomes (localhost_number * 200) + fractional time
2385in units of 1/200 of a second (i.e. a value in the range 0-3399).
2386
2387Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2388Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2389still allows the tttttt field to hold a large enough number to last for some
2390more decades, and the final two-digit field can hold numbers up to 1295, which
2391is enough for milliseconds (instead of 1/2000 of a second).
2392
2393However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2394pid, so it is probably safe because pids have to be positive. The
2395localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2396final field becomes (localhost_number * 100) + fractional time in centiseconds.
2397
2398Note that string_base62() returns its data in a static storage block, so it
2399must be copied before calling string_base62() again. It always returns exactly
24006 characters.
2401
2402There doesn't seem to be anything in the RFC which requires a message id to
2403start with a letter, but Smail was changed to ensure this. The external form of
2404the message id (as supplied by string expansion) therefore starts with an
2405additional leading 'E'. The spool file names do not include this leading
2406letter and it is not used internally.
2407
2408NOTE: If ever the format of message ids is changed, the regular expression for
2409checking that a string is in this format must be updated in a corresponding
2410way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2411must also be changed to reflect the correct string length. Then, of course,
2412other programs that rely on the message id format will need updating too. */
2413
2414Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2415message_id[6] = '-';
2416Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2417
2418/* Deal with the case where the host number is set. The value of the number was
2419checked when it was read, to ensure it isn't too big. The timing granularity is
2420left in id_resolution so that an appropriate wait can be done after receiving
2421the message, if necessary (we hope it won't be). */
2422
2423if (host_number_string != NULL)
2424 {
2425 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2426 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2427 string_base62((long int)(
2428 host_number * (1000000/id_resolution) +
2429 message_id_tv.tv_usec/id_resolution)) + 4);
2430 }
2431
2432/* Host number not set: final field is just the fractional time at an
2433appropriate resolution. */
2434
2435else
2436 {
2437 id_resolution = (BASE_62 == 62)? 500 : 1000;
2438 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2439 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2440 }
2441
2442/* Add the current message id onto the current process info string if
2443it will fit. */
2444
2445(void)string_format(process_info + process_info_len,
2446 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2447
2448/* If we are using multiple input directories, set up the one for this message
2449to be the least significant base-62 digit of the time of arrival. Otherwise
2450ensure that it is an empty string. */
2451
2452message_subdir[0] = split_spool_directory? message_id[5] : 0;
2453
2454/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2455one, but only for local (without suppress_local_fixups) or submission mode
2456messages. This can be user-configured if required, but we had better flatten
2457any illegal characters therein. */
059ec3d9 2458
8800895a
PH
2459if (msgid_header == NULL &&
2460 ((sender_host_address == NULL && !suppress_local_fixups)
2461 || submission_mode))
059ec3d9
PH
2462 {
2463 uschar *p;
2464 uschar *id_text = US"";
2465 uschar *id_domain = primary_hostname;
2466
2467 /* Permit only letters, digits, dots, and hyphens in the domain */
2468
2469 if (message_id_domain != NULL)
2470 {
2471 uschar *new_id_domain = expand_string(message_id_domain);
2472 if (new_id_domain == NULL)
2473 {
2474 if (!expand_string_forcedfail)
2475 log_write(0, LOG_MAIN|LOG_PANIC,
2476 "expansion of \"%s\" (message_id_header_domain) "
2477 "failed: %s", message_id_domain, expand_string_message);
2478 }
2479 else if (*new_id_domain != 0)
2480 {
2481 id_domain = new_id_domain;
2482 for (p = id_domain; *p != 0; p++)
2483 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2484 }
2485 }
2486
2487 /* Permit all characters except controls and RFC 2822 specials in the
2488 additional text part. */
2489
2490 if (message_id_text != NULL)
2491 {
2492 uschar *new_id_text = expand_string(message_id_text);
2493 if (new_id_text == NULL)
2494 {
2495 if (!expand_string_forcedfail)
2496 log_write(0, LOG_MAIN|LOG_PANIC,
2497 "expansion of \"%s\" (message_id_header_text) "
2498 "failed: %s", message_id_text, expand_string_message);
2499 }
2500 else if (*new_id_text != 0)
2501 {
2502 id_text = new_id_text;
2503 for (p = id_text; *p != 0; p++)
2504 if (mac_iscntrl_or_special(*p)) *p = '-';
2505 }
2506 }
2507
e7e680d6
PP
2508 /* Add the header line
2509 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2510 * appended, to preserve classical expectations of header ordering. */
059ec3d9 2511
e7e680d6 2512 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
5eb690a1
NM
2513 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2514 (*id_text == 0)? "" : ".", id_text, id_domain);
059ec3d9
PH
2515 }
2516
2517/* If we are to log recipients, keep a copy of the raw ones before any possible
2518rewriting. Must copy the count, because later ACLs and the local_scan()
2519function may mess with the real recipients. */
2520
2521if ((log_extra_selector & LX_received_recipients) != 0)
2522 {
2523 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2524 for (i = 0; i < recipients_count; i++)
2525 raw_recipients[i] = string_copy(recipients_list[i].address);
2526 raw_recipients_count = recipients_count;
2527 }
2528
2529/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2530recipients will get here only if the conditions were right (allow_unqualified_
2531recipient is TRUE). */
2532
2533for (i = 0; i < recipients_count; i++)
2534 recipients_list[i].address =
2535 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2536 global_rewrite_rules, rewrite_existflags);
2537
8800895a
PH
2538/* If there is no From: header, generate one for local (without
2539suppress_local_fixups) or submission_mode messages. If there is no sender
2540address, but the sender is local or this is a local delivery error, use the
2541originator login. This shouldn't happen for genuine bounces, but might happen
2542for autoreplies. The addition of From: must be done *before* checking for the
2543possible addition of a Sender: header, because untrusted_set_sender allows an
2544untrusted user to set anything in the envelope (which might then get info
2545From:) but we still want to ensure a valid Sender: if it is required. */
2546
2547if (from_header == NULL &&
2548 ((sender_host_address == NULL && !suppress_local_fixups)
2549 || submission_mode))
059ec3d9 2550 {
2fe1a124
PH
2551 uschar *oname = US"";
2552
2553 /* Use the originator_name if this is a locally submitted message and the
2554 caller is not trusted. For trusted callers, use it only if -F was used to
2555 force its value or if we have a non-SMTP message for which -f was not used
2556 to set the sender. */
2557
2558 if (sender_host_address == NULL)
2559 {
2560 if (!trusted_caller || sender_name_forced ||
2561 (!smtp_input && !sender_address_forced))
2562 oname = originator_name;
2563 }
2564
2565 /* For non-locally submitted messages, the only time we use the originator
2566 name is when it was forced by the /name= option on control=submission. */
2567
2568 else
2569 {
2570 if (submission_name != NULL) oname = submission_name;
2571 }
2572
059ec3d9
PH
2573 /* Envelope sender is empty */
2574
2575 if (sender_address[0] == 0)
2576 {
87ba3f5f
PH
2577 uschar *fromstart, *fromend;
2578
2579 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2580 oname, (oname[0] == 0)? "" : " <");
2581 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2582
059ec3d9
PH
2583 if (sender_local || local_error_message)
2584 {
87ba3f5f
PH
2585 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2586 local_part_quote(originator_login), qualify_domain_sender,
2587 fromend);
059ec3d9
PH
2588 }
2589 else if (submission_mode && authenticated_id != NULL)
2590 {
2591 if (submission_domain == NULL)
2592 {
87ba3f5f
PH
2593 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2594 local_part_quote(authenticated_id), qualify_domain_sender,
2595 fromend);
059ec3d9
PH
2596 }
2597 else if (submission_domain[0] == 0) /* empty => whole address set */
2598 {
87ba3f5f
PH
2599 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2600 fromend);
059ec3d9
PH
2601 }
2602 else
2603 {
87ba3f5f
PH
2604 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2605 local_part_quote(authenticated_id), submission_domain,
2606 fromend);
059ec3d9
PH
2607 }
2608 from_header = header_last; /* To get it checked for Sender: */
2609 }
2610 }
2611
2612 /* There is a non-null envelope sender. Build the header using the original
2613 sender address, before any rewriting that might have been done while
2614 verifying it. */
2615
2616 else
2617 {
87ba3f5f 2618 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2619 oname,
2620 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2621 (sender_address_unrewritten == NULL)?
2622 sender_address : sender_address_unrewritten,
2fe1a124 2623 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2624
2625 from_header = header_last; /* To get it checked for Sender: */
2626 }
2627 }
2628
2629
8800895a
PH
2630/* If the sender is local (without suppress_local_fixups), or if we are in
2631submission mode and there is an authenticated_id, check that an existing From:
2632is correct, and if not, generate a Sender: header, unless disabled. Any
2633previously-existing Sender: header was removed above. Note that sender_local,
2634as well as being TRUE if the caller of exim is not trusted, is also true if a
2635trusted caller did not supply a -f argument for non-smtp input. To allow
2636trusted callers to forge From: without supplying -f, we have to test explicitly
2637here. If the From: header contains more than one address, then the call to
2638parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2639
2640if (from_header != NULL &&
69358f02 2641 (active_local_from_check &&
8800895a 2642 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2643 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2644 ))
2645 {
2646 BOOL make_sender = TRUE;
2647 int start, end, domain;
2648 uschar *errmess;
2649 uschar *from_address =
2650 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2651 &start, &end, &domain, FALSE);
2652 uschar *generated_sender_address;
2653
2654 if (submission_mode)
2655 {
2656 if (submission_domain == NULL)
2657 {
2658 generated_sender_address = string_sprintf("%s@%s",
2659 local_part_quote(authenticated_id), qualify_domain_sender);
2660 }
2661 else if (submission_domain[0] == 0) /* empty => full address */
2662 {
2663 generated_sender_address = string_sprintf("%s",
2664 authenticated_id);
2665 }
2666 else
2667 {
2668 generated_sender_address = string_sprintf("%s@%s",
2669 local_part_quote(authenticated_id), submission_domain);
2670 }
2671 }
2672 else
2673 generated_sender_address = string_sprintf("%s@%s",
2674 local_part_quote(originator_login), qualify_domain_sender);
2675
2676 /* Remove permitted prefixes and suffixes from the local part of the From:
2677 address before doing the comparison with the generated sender. */
2678
2679 if (from_address != NULL)
2680 {
2681 int slen;
2682 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2683
2684 if (at != NULL) *at = 0;
2685 from_address += route_check_prefix(from_address, local_from_prefix);
2686 slen = route_check_suffix(from_address, local_from_suffix);
2687 if (slen > 0)
2688 {
2689 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2690 from_address += slen;
2691 }
2692 if (at != NULL) *at = '@';
2693
2694 if (strcmpic(generated_sender_address, from_address) == 0 ||
2695 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2696 make_sender = FALSE;
2697 }
2698
2699 /* We have to cause the Sender header to be rewritten if there are
2700 appropriate rewriting rules. */
2701
2702 if (make_sender)
2703 {
2fe1a124 2704 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2705 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2706 generated_sender_address);
2707 else
2708 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2709 resent_prefix,
2710 submission_mode? submission_name : originator_name,
2711 generated_sender_address);
059ec3d9 2712 }
87ba3f5f
PH
2713
2714 /* Ensure that a non-null envelope sender address corresponds to the
2715 submission mode sender address. */
2716
2717 if (submission_mode && sender_address[0] != 0)
2718 {
2719 if (sender_address_unrewritten == NULL)
2720 sender_address_unrewritten = sender_address;
2721 sender_address = generated_sender_address;
089793a4
TF
2722 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2723 log_write(L_address_rewrite, LOG_MAIN,
2724 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2725 sender_address_unrewritten, generated_sender_address);
87ba3f5f 2726 }
059ec3d9
PH
2727 }
2728
059ec3d9
PH
2729/* If there are any rewriting rules, apply them to the sender address, unless
2730it has already been rewritten as part of verification for SMTP input. */
2731
2732if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2733 sender_address[0] != 0)
2734 {
2735 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2736 global_rewrite_rules, rewrite_existflags);
2737 DEBUG(D_receive|D_rewrite)
2738 debug_printf("rewritten sender = %s\n", sender_address);
2739 }
2740
2741
2742/* The headers must be run through rewrite_header(), because it ensures that
2743addresses are fully qualified, as well as applying any rewriting rules that may
2744exist.
2745
2746Qualification of header addresses in a message from a remote host happens only
2747if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2748appropriate. For local messages, qualification always happens, unless -bnq is
2749used to explicitly suppress it. No rewriting is done for an unqualified address
2750that is left untouched.
2751
2752We start at the second header, skipping our own Received:. This rewriting is
2753documented as happening *after* recipient addresses are taken from the headers
2754by the -t command line option. An added Sender: gets rewritten here. */
2755
2756for (h = header_list->next; h != NULL; h = h->next)
2757 {
2758 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2759 rewrite_existflags, TRUE);
2760 if (newh != NULL) h = newh;
2761 }
2762
2763
2764/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2765"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2766"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2767exists, this applies to the set of resent- headers rather than the normal set.
2768
2cbb4081
PH
2769The requirement for a recipient header has been removed in RFC 2822. At this
2770point in the code, earlier versions of Exim added a To: header for locally
2771submitted messages, and an empty Bcc: header for others. In the light of the
2772changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2773
059ec3d9
PH
2774
2775/* If there is no date header, generate one if the message originates locally
8800895a
PH
2776(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2777submission mode flag is set. Messages without Date: are not valid, but it seems
e7e680d6
PP
2778to be more confusing if Exim adds one to all remotely-originated messages.
2779As per Message-Id, we prepend if resending, else append.
2780*/
059ec3d9 2781
8800895a
PH
2782if (!date_header_exists &&
2783 ((sender_host_address == NULL && !suppress_local_fixups)
2784 || submission_mode))
e7e680d6
PP
2785 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2786 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
059ec3d9
PH
2787
2788search_tidyup(); /* Free any cached resources */
2789
2790/* Show the complete set of headers if debugging. Note that the first one (the
2791new Received:) has not yet been set. */
2792
2793DEBUG(D_receive)
2794 {
2795 debug_printf(">>Headers after rewriting and local additions:\n");
2796 for (h = header_list->next; h != NULL; h = h->next)
2797 debug_printf("%c %s", h->type, h->text);
2798 debug_printf("\n");
2799 }
2800
2801/* The headers are now complete in store. If we are running in filter
2802testing mode, that is all this function does. Return TRUE if the message
2803ended with a dot. */
2804
f05da2e8 2805if (filter_test != FTEST_NONE)
059ec3d9
PH
2806 {
2807 process_info[process_info_len] = 0;
2808 return message_ended == END_DOT;
2809 }
2810
817d9f57 2811/* Cutthrough delivery:
e4bdf652
JH
2812 We have to create the Received header now rather than at the end of reception,
2813 so the timestamp behaviour is a change to the normal case.
2814 XXX Ensure this gets documented XXX.
817d9f57 2815 Having created it, send the headers to the destination.
e4bdf652
JH
2816*/
2817if (cutthrough_fd >= 0)
2818 {
817d9f57
JH
2819 if (received_count > received_headers_max)
2820 {
2e5b33cd 2821 cancel_cutthrough_connection("too many headers");
817d9f57
JH
2822 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2823 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2824 "Too many \"Received\" headers",
2825 sender_address,
2826 (sender_fullhost == NULL)? "" : " H=",
2827 (sender_fullhost == NULL)? US"" : sender_fullhost,
2828 (sender_ident == NULL)? "" : " U=",
2829 (sender_ident == NULL)? US"" : sender_ident);
2830 message_id[0] = 0; /* Indicate no message accepted */
2831 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2832 goto TIDYUP; /* Skip to end of function */
2833 }
e4bdf652 2834 received_header_gen();
578d43dc 2835 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652
JH
2836 (void) cutthrough_headers_send();
2837 }
61147df4 2838
e4bdf652 2839
059ec3d9
PH
2840/* Open a new spool file for the data portion of the message. We need
2841to access it both via a file descriptor and a stream. Try to make the
2842directory if it isn't there. Note re use of sprintf: spool_directory
2843is checked on input to be < 200 characters long. */
2844
2845sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir,
2846 message_id);
2847data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2848if (data_fd < 0)
2849 {
2850 if (errno == ENOENT)
2851 {
2852 uschar temp[16];
2853 sprintf(CS temp, "input/%s", message_subdir);
2854 if (message_subdir[0] == 0) temp[5] = 0;
2855 (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE);
2856 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2857 }
2858 if (data_fd < 0)
2859 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2860 spool_name, strerror(errno));
2861 }
2862
2863/* Make sure the file's group is the Exim gid, and double-check the mode
2864because the group setting doesn't always get set automatically. */
2865
1ac6b2e7
JH
2866if (fchown(data_fd, exim_uid, exim_gid))
2867 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2868 "Failed setting ownership on spool file %s: %s",
2869 spool_name, strerror(errno));
ff790e47 2870(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2871
2872/* We now have data file open. Build a stream for it and lock it. We lock only
2873the first line of the file (containing the message ID) because otherwise there
2874are problems when Exim is run under Cygwin (I'm told). See comments in
2875spool_in.c, where the same locking is done. */
2876
2877data_file = fdopen(data_fd, "w+");
2878lock_data.l_type = F_WRLCK;
2879lock_data.l_whence = SEEK_SET;
2880lock_data.l_start = 0;
2881lock_data.l_len = SPOOL_DATA_START_OFFSET;
2882
2883if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2884 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2885 errno, strerror(errno));
2886
2887/* We have an open, locked data file. Write the message id to it to make it
2888self-identifying. Then read the remainder of the input of this message and
2889write it to the data file. If the variable next != NULL, it contains the first
2890data line (which was read as a header but then turned out not to have the right
2891format); write it (remembering that it might contain binary zeros). The result
2892of fwrite() isn't inspected; instead we call ferror() below. */
2893
2894fprintf(data_file, "%s-D\n", message_id);
2895if (next != NULL)
2896 {
2897 uschar *s = next->text;
2898 int len = next->slen;
1ac6b2e7 2899 len = fwrite(s, 1, len, data_file); len = len; /* compiler quietening */
059ec3d9
PH
2900 body_linecount++; /* Assumes only 1 line */
2901 }
2902
2903/* Note that we might already be at end of file, or the logical end of file
2904(indicated by '.'), or might have encountered an error while writing the
2905message id or "next" line. */
2906
2907if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2908 {
2909 if (smtp_input)
2910 {
2911 message_ended = read_message_data_smtp(data_file);
2912 receive_linecount++; /* The terminating "." line */
2913 }
2914 else message_ended = read_message_data(data_file);
2915
2916 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 2917 message_linecount += body_linecount;
059ec3d9
PH
2918
2919 /* Handle premature termination of SMTP */
2920
2921 if (smtp_input && message_ended == END_EOF)
2922 {
2923 Uunlink(spool_name); /* Lose data file when closed */
2e5b33cd 2924 cancel_cutthrough_connection("sender closed connection");
059ec3d9
PH
2925 message_id[0] = 0; /* Indicate no message accepted */
2926 smtp_reply = handle_lost_connection(US"");
2927 smtp_yield = FALSE;
2928 goto TIDYUP; /* Skip to end of function */
2929 }
2930
2931 /* Handle message that is too big. Don't use host_or_ident() in the log
2932 message; we want to see the ident value even for non-remote messages. */
2933
2934 if (message_ended == END_SIZE)
2935 {
2936 Uunlink(spool_name); /* Lose the data file when closed */
2e5b33cd 2937 cancel_cutthrough_connection("mail too big");
059ec3d9
PH
2938 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2939
2940 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2941 "message too big: read=%d max=%d",
2942 sender_address,
2943 (sender_fullhost == NULL)? "" : " H=",
2944 (sender_fullhost == NULL)? US"" : sender_fullhost,
2945 (sender_ident == NULL)? "" : " U=",
2946 (sender_ident == NULL)? US"" : sender_ident,
2947 message_size,
2948 thismessage_size_limit);
2949
2950 if (smtp_input)
2951 {
2952 smtp_reply = US"552 Message size exceeds maximum permitted";
2953 message_id[0] = 0; /* Indicate no message accepted */
2954 goto TIDYUP; /* Skip to end of function */
2955 }
2956 else
2957 {
2958 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2959 give_local_error(ERRMESS_TOOBIG,
2960 string_sprintf("message too big (max=%d)", thismessage_size_limit),
2961 US"message rejected: ", error_rc, data_file, header_list);
2962 /* Does not return */
2963 }
2964 }
2965 }
2966
2967/* Restore the standard SIGALRM handler for any subsequent processing. (For
2968example, there may be some expansion in an ACL that uses a timer.) */
2969
2970os_non_restarting_signal(SIGALRM, sigalrm_handler);
2971
2972/* The message body has now been read into the data file. Call fflush() to
2973empty the buffers in C, and then call fsync() to get the data written out onto
2974the disk, as fflush() doesn't do this (or at least, it isn't documented as
2975having to do this). If there was an I/O error on either input or output,
2976attempt to send an error message, and unlink the spool file. For non-SMTP input
2977we can then give up. Note that for SMTP input we must swallow the remainder of
2978the input in cases of output errors, since the far end doesn't expect to see
2979anything until the terminating dot line is sent. */
2980
2981if (fflush(data_file) == EOF || ferror(data_file) ||
54fc8428 2982 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
059ec3d9
PH
2983 {
2984 uschar *msg_errno = US strerror(errno);
2985 BOOL input_error = (receive_ferror)() != 0;
2986 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
2987 input_error? "Input read" : "Spool write",
2988 msg_errno,
2989 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
2990
2991 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
2992 Uunlink(spool_name); /* Lose the data file */
2e5b33cd 2993 cancel_cutthrough_connection("error writing spoolfile");
059ec3d9
PH
2994
2995 if (smtp_input)
2996 {
2997 if (input_error)
2998 smtp_reply = US"451 Error while reading input data";
2999 else
3000 {
3001 smtp_reply = US"451 Error while writing spool file";
3002 receive_swallow_smtp();
3003 }
3004 message_id[0] = 0; /* Indicate no message accepted */
3005 goto TIDYUP; /* Skip to end of function */
3006 }
3007
3008 else
3009 {
3010 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3011 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
3012 header_list);
3013 /* Does not return */
3014 }
3015 }
3016
3017
3018/* No I/O errors were encountered while writing the data file. */
3019
3020DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
3021
3022
3023/* If there were any bad addresses extracted by -t, or there were no recipients
3024left after -t, send a message to the sender of this message, or write it to
3025stderr if the error handling option is set that way. Note that there may
3026legitimately be no recipients for an SMTP message if they have all been removed
3027by "discard".
3028
3029We need to rewind the data file in order to read it. In the case of no
3030recipients or stderr error writing, throw the data file away afterwards, and
3031exit. (This can't be SMTP, which always ensures there's at least one
3032syntactically good recipient address.) */
3033
3034if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
3035 {
3036 DEBUG(D_receive)
3037 {
3038 if (recipients_count == 0) debug_printf("*** No recipients\n");
3039 if (bad_addresses != NULL)
3040 {
3041 error_block *eblock = bad_addresses;
3042 debug_printf("*** Bad address(es)\n");
3043 while (eblock != NULL)
3044 {
3045 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
3046 eblock = eblock->next;
3047 }
3048 }
3049 }
3050
3051 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3052
3053 /* If configured to send errors to the sender, but this fails, force
3054 a failure error code. We use a special one for no recipients so that it
3055 can be detected by the autoreply transport. Otherwise error_rc is set to
3056 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
3057 it is EXIT_SUCCESS. */
3058
3059 if (error_handling == ERRORS_SENDER)
3060 {
3061 if (!moan_to_sender(
3062 (bad_addresses == NULL)?
3063 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
3064 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
3065 bad_addresses, header_list, data_file, FALSE))
3066 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
3067 }
3068 else
3069 {
3070 if (bad_addresses == NULL)
3071 {
3072 if (extracted_ignored)
3073 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
3074 else
3075 fprintf(stderr, "exim: no recipients in message\n");
3076 }
3077 else
3078 {
3079 fprintf(stderr, "exim: invalid address%s",
3080 (bad_addresses->next == NULL)? ":" : "es:\n");
3081 while (bad_addresses != NULL)
3082 {
3083 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
3084 bad_addresses->text2);
3085 bad_addresses = bad_addresses->next;
3086 }
3087 }
3088 }
3089
3090 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
3091 {
3092 Uunlink(spool_name);
f1e894f3 3093 (void)fclose(data_file);
059ec3d9
PH
3094 exim_exit(error_rc);
3095 }
3096 }
3097
3098/* Data file successfully written. Generate text for the Received: header by
3099expanding the configured string, and adding a timestamp. By leaving this
3100operation till now, we ensure that the timestamp is the time that message
3101reception was completed. However, this is deliberately done before calling the
3102data ACL and local_scan().
3103
3104This Received: header may therefore be inspected by the data ACL and by code in
3105the local_scan() function. When they have run, we update the timestamp to be
3106the final time of reception.
3107
3108If there is just one recipient, set up its value in the $received_for variable
3109for use when we generate the Received: header.
3110
3111Note: the checking for too many Received: headers is handled by the delivery
3112code. */
e4bdf652 3113/*XXX eventually add excess Received: check for cutthrough case back when classifying them */
059ec3d9 3114
e4bdf652 3115if (received_header->text == NULL) /* Non-cutthrough case */
059ec3d9 3116 {
e4bdf652 3117 received_header_gen();
059ec3d9 3118
e4bdf652 3119 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
059ec3d9 3120
e4bdf652
JH
3121 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3122 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9 3123
e4bdf652
JH
3124 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3125 now, before running the DATA ACL. */
059ec3d9 3126
578d43dc 3127 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652 3128 }
817d9f57 3129else
e4bdf652
JH
3130 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3131 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9
PH
3132
3133/* If an ACL is specified for checking things at this stage of reception of a
3134message, run it, unless all the recipients were removed by "discard" in earlier
3135ACLs. That is the only case in which recipients_count can be zero at this
3136stage. Set deliver_datafile to point to the data file so that $message_body and
3137$message_body_end can be extracted if needed. Allow $recipients in expansions.
3138*/
3139
3140deliver_datafile = data_fd;
4e88a19f 3141user_msg = NULL;
059ec3d9 3142
0e20aff9
MH
3143enable_dollar_recipients = TRUE;
3144
059ec3d9
PH
3145if (recipients_count == 0)
3146 {
3147 blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL";
3148 }
3149else
3150 {
059ec3d9
PH
3151 /* Handle interactive SMTP messages */
3152
3153 if (smtp_input && !smtp_batched_input)
3154 {
8523533c 3155
80a47a2c
TK
3156#ifndef DISABLE_DKIM
3157 if (!dkim_disable_verify)
3158 {
3159 /* Finish verification, this will log individual signature results to
3160 the mainlog */
3161 dkim_exim_verify_finish();
3162
3163 /* Check if we must run the DKIM ACL */
3164 if ((acl_smtp_dkim != NULL) &&
3165 (dkim_verify_signers != NULL) &&
3166 (dkim_verify_signers[0] != '\0'))
3167 {
3168 uschar *dkim_verify_signers_expanded =
3169 expand_string(dkim_verify_signers);
3170 if (dkim_verify_signers_expanded == NULL)
3171 {
3172 log_write(0, LOG_MAIN|LOG_PANIC,
3173 "expansion of dkim_verify_signers option failed: %s",
3174 expand_string_message);
3175 }
3176 else
3177 {
3178 int sep = 0;
3179 uschar *ptr = dkim_verify_signers_expanded;
3180 uschar *item = NULL;
9e5d6b55
TK
3181 uschar *seen_items = NULL;
3182 int seen_items_size = 0;
3183 int seen_items_offset = 0;
80a47a2c 3184 uschar itembuf[256];
9122af94
TK
3185 /* Default to OK when no items are present */
3186 rc = OK;
80a47a2c
TK
3187 while ((item = string_nextinlist(&ptr, &sep,
3188 itembuf,
3189 sizeof(itembuf))) != NULL)
3190 {
6119d1ea
TK
3191 /* Prevent running ACL for an empty item */
3192 if (!item || (item[0] == '\0')) continue;
9e5d6b55
TK
3193 /* Only run ACL once for each domain or identity, no matter how often it
3194 appears in the expanded list. */
6119d1ea
TK
3195 if (seen_items != NULL)
3196 {
ae9094bf
TK
3197 uschar *seen_item = NULL;
3198 uschar seen_item_buf[256];
4a73449b 3199 uschar *seen_items_list = seen_items;
ae9094bf 3200 int seen_this_item = 0;
61147df4 3201
ae9094bf
TK
3202 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
3203 seen_item_buf,
3204 sizeof(seen_item_buf))) != NULL)
3205 {
3206 if (Ustrcmp(seen_item,item) == 0)
3207 {
3208 seen_this_item = 1;
3209 break;
61147df4 3210 }
ae9094bf
TK
3211 }
3212
3213 if (seen_this_item > 0)
6119d1ea
TK
3214 {
3215 DEBUG(D_receive)
3216 debug_printf("acl_smtp_dkim: skipping signer %s, already seen\n", item);
3217 continue;
3218 }
61147df4 3219
4a73449b 3220 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,":");
6119d1ea
TK
3221 }
3222
4a73449b
TK
3223 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,item);
3224 seen_items[seen_items_offset] = '\0';
6119d1ea
TK
3225
3226 DEBUG(D_receive)
3227 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n", item);
3228
80a47a2c
TK
3229 dkim_exim_acl_setup(item);
3230 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim, &user_msg, &log_msg);
6119d1ea
TK
3231
3232 if (rc != OK)
3233 {
3234 DEBUG(D_receive)
3235 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, skipping remaining items\n", rc, item);
2e5b33cd 3236 cancel_cutthrough_connection("dkim acl not ok");
6119d1ea
TK
3237 break;
3238 }
80a47a2c 3239 }
578d43dc 3240 add_acl_headers(ACL_WHERE_DKIM, US"DKIM");
80a47a2c
TK
3241 if (rc == DISCARD)
3242 {
3243 recipients_count = 0;
3244 blackholed_by = US"DKIM ACL";
3245 if (log_msg != NULL)
3246 blackhole_log_msg = string_sprintf(": %s", log_msg);
3247 }
3248 else if (rc != OK)
3249 {
3250 Uunlink(spool_name);
3251 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
3252 smtp_yield = FALSE; /* No more messsages after dropped connection */
3253 smtp_reply = US""; /* Indicate reply already sent */
3254 message_id[0] = 0; /* Indicate no message accepted */
3255 goto TIDYUP; /* Skip to end of function */
3256 }
3257 }
3258 }
3259 }
4a8ce2d8 3260#endif /* DISABLE_DKIM */
fb2274d4 3261
8523533c 3262#ifdef WITH_CONTENT_SCAN
80a47a2c
TK
3263 if (recipients_count > 0 &&
3264 acl_smtp_mime != NULL &&
54cdb463
PH
3265 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3266 goto TIDYUP;
8523533c
TK
3267#endif /* WITH_CONTENT_SCAN */
3268
4840604e
TL
3269#ifdef EXPERIMENTAL_DMARC
3270 dmarc_up = dmarc_store_data(from_header);
3271#endif /* EXPERIMENTAL_DMARC */
3272
8ccd00b1
JH
3273#ifndef DISABLE_PRDR
3274 if (prdr_requested && recipients_count > 1 && acl_smtp_data_prdr)
fd98a5c6
JH
3275 {
3276 unsigned int c;
3277 int all_pass = OK;
3278 int all_fail = FAIL;
3279
3280 smtp_printf("353 PRDR content analysis beginning\r\n");
3281 /* Loop through recipients, responses must be in same order received */
3282 for (c = 0; recipients_count > c; c++)
3283 {
3284 uschar * addr= recipients_list[c].address;
3285 uschar * msg= US"PRDR R=<%s> %s";
3286 uschar * code;
3287 DEBUG(D_receive)
3288 debug_printf("PRDR processing recipient %s (%d of %d)\n",
3289 addr, c+1, recipients_count);
3290 rc = acl_check(ACL_WHERE_PRDR, addr,
3291 acl_smtp_data_prdr, &user_msg, &log_msg);
3292
3293 /* If any recipient rejected content, indicate it in final message */
3294 all_pass |= rc;
3295 /* If all recipients rejected, indicate in final message */
3296 all_fail &= rc;
3297
3298 switch (rc)
3299 {
3300 case OK: case DISCARD: code = US"250"; break;
3301 case DEFER: code = US"450"; break;
3302 default: code = US"550"; break;
3303 }
3304 if (user_msg != NULL)
3305 smtp_user_msg(code, user_msg);
3306 else
3307 {
3308 switch (rc)
3309 {
3310 case OK: case DISCARD:
3311 msg = string_sprintf(CS msg, addr, "acceptance"); break;
3312 case DEFER:
3313 msg = string_sprintf(CS msg, addr, "temporary refusal"); break;
3314 default:
3315 msg = string_sprintf(CS msg, addr, "refusal"); break;
3316 }
3317 smtp_user_msg(code, msg);
3318 }
3319 if (log_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, log_msg);
3320 else if (user_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, user_msg);
112b6a93 3321 else log_write(0, LOG_MAIN, "%s", CS msg);
fd98a5c6
JH
3322
3323 if (rc != OK) { receive_remove_recipient(addr); c--; }
3324 }
3325 /* Set up final message, used if data acl gives OK */
3326 smtp_reply = string_sprintf("%s id=%s message %s",
3327 all_fail == FAIL ? US"550" : US"250",
3328 message_id,
3329 all_fail == FAIL
3330 ? US"rejected for all recipients"
3331 : all_pass == OK
3332 ? US"accepted"
3333 : US"accepted for some recipients");
3334 if (recipients_count == 0)
3335 {
3336 message_id[0] = 0; /* Indicate no message accepted */
3337 goto TIDYUP;
3338 }
3339 }
3340 else
3341 prdr_requested = FALSE;
8ccd00b1 3342#endif /* !DISABLE_PRDR */
fd98a5c6 3343
54cdb463
PH
3344 /* Check the recipients count again, as the MIME ACL might have changed
3345 them. */
8523533c 3346
059ec3d9
PH
3347 if (acl_smtp_data != NULL && recipients_count > 0)
3348 {
059ec3d9 3349 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
578d43dc 3350 add_acl_headers(ACL_WHERE_DATA, US"DATA");
059ec3d9
PH
3351 if (rc == DISCARD)
3352 {
3353 recipients_count = 0;
3354 blackholed_by = US"DATA ACL";
8e669ac1
PH
3355 if (log_msg != NULL)
3356 blackhole_log_msg = string_sprintf(": %s", log_msg);
2e5b33cd 3357 cancel_cutthrough_connection("data acl discard");
059ec3d9
PH
3358 }
3359 else if (rc != OK)
3360 {
3361 Uunlink(spool_name);
2e5b33cd 3362 cancel_cutthrough_connection("data acl not ok");
8523533c
TK
3363#ifdef WITH_CONTENT_SCAN
3364 unspool_mbox();
6f0c431a
PP
3365#endif
3366#ifdef EXPERIMENTAL_DCC
3367 dcc_ok = 0;
8523533c 3368#endif
059ec3d9
PH
3369 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
3370 smtp_yield = FALSE; /* No more messsages after dropped connection */
3371 smtp_reply = US""; /* Indicate reply already sent */
3372 message_id[0] = 0; /* Indicate no message accepted */
3373 goto TIDYUP; /* Skip to end of function */
3374 }
3375 }
3376 }
3377
3378 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3379 we cannot take different actions for permanent and temporary rejections. */
3380
54cdb463 3381 else
059ec3d9 3382 {
54cdb463
PH
3383
3384#ifdef WITH_CONTENT_SCAN
3385 if (acl_not_smtp_mime != NULL &&
3386 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3387 &blackholed_by))
3388 goto TIDYUP;
3389#endif /* WITH_CONTENT_SCAN */
3390
3391 if (acl_not_smtp != NULL)
059ec3d9 3392 {
54cdb463
PH
3393 uschar *user_msg, *log_msg;
3394 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3395 if (rc == DISCARD)
059ec3d9 3396 {
54cdb463
PH
3397 recipients_count = 0;
3398 blackholed_by = US"non-SMTP ACL";
3399 if (log_msg != NULL)
3400 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 3401 }
54cdb463 3402 else if (rc != OK)
059ec3d9 3403 {
54cdb463
PH
3404 Uunlink(spool_name);
3405#ifdef WITH_CONTENT_SCAN
3406 unspool_mbox();
6f0c431a
PP
3407#endif
3408#ifdef EXPERIMENTAL_DCC
3409 dcc_ok = 0;
54cdb463 3410#endif
6ea85e9a
PH
3411 /* The ACL can specify where rejections are to be logged, possibly
3412 nowhere. The default is main and reject logs. */
3413
3414 if (log_reject_target != 0)
3415 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3416 sender_address, log_msg);
3417
54cdb463
PH
3418 if (user_msg == NULL) user_msg = US"local configuration problem";
3419 if (smtp_batched_input)
3420 {
3421 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3422 /* Does not return */
3423 }
3424 else
3425 {
3426 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3427 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3428 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3429 header_list);
3430 /* Does not return */
3431 }
059ec3d9 3432 }
578d43dc 3433 add_acl_headers(ACL_WHERE_NOTSMTP, US"non-SMTP");
059ec3d9 3434 }
059ec3d9
PH
3435 }
3436
54cdb463
PH
3437 /* The applicable ACLs have been run */
3438
059ec3d9
PH
3439 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3440 if (queue_only_policy) queued_by = US"ACL";
059ec3d9
PH
3441 }
3442
8523533c
TK
3443#ifdef WITH_CONTENT_SCAN
3444unspool_mbox();
3445#endif
3446
6a8f9482
TK
3447#ifdef EXPERIMENTAL_DCC
3448dcc_ok = 0;
3449#endif
3450
3451
059ec3d9
PH
3452/* The final check on the message is to run the scan_local() function. The
3453version supplied with Exim always accepts, but this is a hook for sysadmins to
3454supply their own checking code. The local_scan() function is run even when all
3455the recipients have been discarded. */
3456
3457lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3458
3459/* Arrange to catch crashes in local_scan(), so that the -D file gets
3460deleted, and the incident gets logged. */
3461
3462os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3463os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3464os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3465os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3466
3467DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3468 local_scan_timeout);
3469local_scan_data = NULL;
3470
3471os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3472if (local_scan_timeout > 0) alarm(local_scan_timeout);
3473rc = local_scan(data_fd, &local_scan_data);
3474alarm(0);
3475os_non_restarting_signal(SIGALRM, sigalrm_handler);
3476
0e20aff9
MH
3477enable_dollar_recipients = FALSE;
3478
059ec3d9
PH
3479store_pool = POOL_MAIN; /* In case changed */
3480DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3481 local_scan_data);
3482
3483os_non_restarting_signal(SIGSEGV, SIG_DFL);
3484os_non_restarting_signal(SIGFPE, SIG_DFL);
3485os_non_restarting_signal(SIGILL, SIG_DFL);
3486os_non_restarting_signal(SIGBUS, SIG_DFL);
3487
3488/* The length check is paranoia against some runaway code, and also because
3489(for a success return) lines in the spool file are read into big_buffer. */
3490
3491if (local_scan_data != NULL)
3492 {
3493 int len = Ustrlen(local_scan_data);
3494 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3495 local_scan_data = string_copyn(local_scan_data, len);
3496 }
3497
3498if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3499 {
58eb016e 3500 if (!deliver_freeze) /* ACL might have already frozen */
059ec3d9
PH
3501 {
3502 deliver_freeze = TRUE;
3503 deliver_frozen_at = time(NULL);
3504 frozen_by = US"local_scan()";
3505 }
3506 rc = LOCAL_SCAN_ACCEPT;
3507 }
3508else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3509 {
3510 if (!queue_only_policy) /* ACL might have already queued */
3511 {
3512 queue_only_policy = TRUE;
3513 queued_by = US"local_scan()";
3514 }
3515 rc = LOCAL_SCAN_ACCEPT;
3516 }
3517
3518/* Message accepted: remove newlines in local_scan_data because otherwise
3519the spool file gets corrupted. Ensure that all recipients are qualified. */
3520
3521if (rc == LOCAL_SCAN_ACCEPT)
3522 {
3523 if (local_scan_data != NULL)
3524 {
3525 uschar *s;
3526 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3527 }
3528 for (i = 0; i < recipients_count; i++)
3529 {
3530 recipient_item *r = recipients_list + i;
3531 r->address = rewrite_address_qualify(r->address, TRUE);
3532 if (r->errors_to != NULL)
3533 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3534 }
3535 if (recipients_count == 0 && blackholed_by == NULL)
3536 blackholed_by = US"local_scan";
3537 }
3538
3539/* Message rejected: newlines permitted in local_scan_data to generate
3540multiline SMTP responses. */
3541
3542else
3543 {
3544 uschar *istemp = US"";
3545 uschar *s = NULL;
a5bd321b 3546 uschar *smtp_code;
059ec3d9
PH
3547 int size = 0;
3548 int sptr = 0;
059ec3d9
PH
3549
3550 errmsg = local_scan_data;
3551
3552 Uunlink(spool_name); /* Cancel this message */
3553 switch(rc)
3554 {
3555 default:
3556 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3557 "rejection given", rc);
3558 goto TEMPREJECT;
3559
3560 case LOCAL_SCAN_REJECT_NOLOGHDR:
3561 log_extra_selector &= ~LX_rejected_header;
3562 /* Fall through */
3563
3564 case LOCAL_SCAN_REJECT:
a5bd321b 3565 smtp_code = US"550";
059ec3d9
PH
3566 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3567 break;
3568
3569 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
3570 log_extra_selector &= ~LX_rejected_header;
3571 /* Fall through */
3572
3573 case LOCAL_SCAN_TEMPREJECT:
3574 TEMPREJECT:
a5bd321b 3575 smtp_code = US"451";
059ec3d9
PH
3576 if (errmsg == NULL) errmsg = US"Temporary local problem";
3577 istemp = US"temporarily ";
3578 break;
3579 }
3580
3581 s = string_append(s, &size, &sptr, 2, US"F=",
3582 (sender_address[0] == 0)? US"<>" : sender_address);
3583 s = add_host_info_for_log(s, &size, &sptr);
3584 s[sptr] = 0;
3585
3586 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3587 s, istemp, string_printing(errmsg));
3588
3589 if (smtp_input)
3590 {
3591 if (!smtp_batched_input)
3592 {
a5bd321b 3593 smtp_respond(smtp_code, 3, TRUE, errmsg);
059ec3d9
PH
3594 message_id[0] = 0; /* Indicate no message accepted */
3595 smtp_reply = US""; /* Indicate reply already sent */
3596 goto TIDYUP; /* Skip to end of function */
3597 }
3598 else
3599 {
a5bd321b 3600 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
059ec3d9
PH
3601 /* Does not return */
3602 }
3603 }
3604 else
3605 {
3606 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3607 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3608 US"message rejected by local scan code: ", error_rc, data_file,
3609 header_list);
3610 /* Does not return */
3611 }
3612 }
3613
3614/* Reset signal handlers to ignore signals that previously would have caused
3615the message to be abandoned. */
3616
3617signal(SIGTERM, SIG_IGN);
3618signal(SIGINT, SIG_IGN);
3619
e4bdf652 3620
059ec3d9
PH
3621/* Ensure the first time flag is set in the newly-received message. */
3622
3623deliver_firsttime = TRUE;
3624
8523533c
TK
3625#ifdef EXPERIMENTAL_BRIGHTMAIL
3626if (bmi_run == 1) {
3627 /* rewind data file */
3628 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3629 bmi_verdicts = bmi_process_message(header_list, data_fd);
3630};
3631#endif
3632
059ec3d9
PH
3633/* Update the timstamp in our Received: header to account for any time taken by
3634an ACL or by local_scan(). The new time is the time that all reception
3635processing is complete. */
3636
3637timestamp = expand_string(US"${tod_full}");
3638tslen = Ustrlen(timestamp);
3639
3640memcpy(received_header->text + received_header->slen - tslen - 1,
3641 timestamp, tslen);
3642
3643/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3644
3645if (mua_wrapper)
3646 {
3647 deliver_freeze = FALSE;
3648 queue_only_policy = FALSE;
3649 }
3650
3651/* Keep the data file open until we have written the header file, in order to
3652hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3653don't write the header file, and we unlink the data file. If writing the header
3654file fails, we have failed to accept this message. */
3655
3656if (host_checking || blackholed_by != NULL)
3657 {
3658 header_line *h;
3659 Uunlink(spool_name);
3660 msg_size = 0; /* Compute size for log line */
3661 for (h = header_list; h != NULL; h = h->next)
3662 if (h->type != '*') msg_size += h->slen;
3663 }
3664
3665/* Write the -H file */
3666
3667else
3668 {
3669 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3670 {
3671 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3672 Uunlink(spool_name); /* Lose the data file */
3673
3674 if (smtp_input)
3675 {
3676 smtp_reply = US"451 Error in writing spool file";
3677 message_id[0] = 0; /* Indicate no message accepted */
3678 goto TIDYUP;
3679 }
3680 else
3681 {
3682 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3683 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3684 header_list);
3685 /* Does not return */
3686 }
3687 }
3688 }
3689
3690
3691/* The message has now been successfully received. */
3692
3693receive_messagecount++;
3694
3695/* In SMTP sessions we may receive several in one connection. After each one,
3696we wait for the clock to tick at the level of message-id granularity. This is
3697so that the combination of time+pid is unique, even on systems where the pid
3698can be re-used within our time interval. We can't shorten the interval without
3699re-designing the message-id. See comments above where the message id is
3700created. This is Something For The Future. */
3701
3702message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3703exim_wait_tick(&message_id_tv, id_resolution);
3704
3705/* Add data size to written header size. We do not count the initial file name
3706that is in the file, but we do add one extra for the notional blank line that
3707precedes the data. This total differs from message_size in that it include the
3708added Received: header and any other headers that got created locally. */
3709
3710fflush(data_file);
3711fstat(data_fd, &statbuf);
3712
3713msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3714
3715/* Generate a "message received" log entry. We do this by building up a dynamic
3716string as required. Since we commonly want to add two items at a time, use a
3717macro to simplify the coding. We log the arrival of a new message while the
3718file is still locked, just in case the machine is *really* fast, and delivers
3719it first! Include any message id that is in the message - since the syntax of a
3720message id is actually an addr-spec, we can use the parse routine to canonicize
3721it. */
3722
3723size = 256;
3724sptr = 0;
3725s = store_get(size);
3726
3727s = string_append(s, &size, &sptr, 2, US"<= ",
3728 (sender_address[0] == 0)? US"<>" : sender_address);
3729if (message_reference != NULL)
3730 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3731
3732s = add_host_info_for_log(s, &size, &sptr);
3733
3734#ifdef SUPPORT_TLS
8ccd00b1 3735if (log_extra_selector & LX_tls_cipher && tls_in.cipher)
817d9f57 3736 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
8ccd00b1 3737if (log_extra_selector & LX_tls_certificate_verified && tls_in.cipher)
059ec3d9 3738 s = string_append(s, &size, &sptr, 2, US" CV=",
817d9f57 3739 tls_in.certificate_verified? "yes":"no");
8ccd00b1 3740if (log_extra_selector & LX_tls_peerdn && tls_in.peerdn)
48ed62d9 3741 s = string_append(s, &size, &sptr, 3, US" DN=\"",
817d9f57 3742 string_printing(tls_in.peerdn), US"\"");
8ccd00b1 3743if (log_extra_selector & LX_tls_sni && tls_in.sni)
3f0945ff 3744 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
817d9f57 3745 string_printing(tls_in.sni), US"\"");
3f0945ff 3746#endif
059ec3d9 3747
8ccd00b1 3748if (sender_host_authenticated)
059ec3d9
PH
3749 {
3750 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
3751 if (authenticated_id != NULL)
c8e2fc1e 3752 {
059ec3d9 3753 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
c8e2fc1e
JH
3754 if (log_extra_selector & LX_smtp_mailauth && authenticated_sender != NULL)
3755 s = string_append(s, &size, &sptr, 2, US":", authenticated_sender);
3756 }
059ec3d9
PH
3757 }
3758
8ccd00b1 3759#ifndef DISABLE_PRDR
fd98a5c6
JH
3760if (prdr_requested)
3761 s = string_append(s, &size, &sptr, 1, US" PRDR");
3762#endif
8ccd00b1 3763
a3c86431 3764#ifdef EXPERIMENTAL_PROXY
8ccd00b1 3765if (proxy_session && log_extra_selector & LX_proxy)
a3bddaa8 3766 s = string_append(s, &size, &sptr, 2, US" PRX=", proxy_host_address);
a3c86431 3767#endif
fd98a5c6 3768
059ec3d9
PH
3769sprintf(CS big_buffer, "%d", msg_size);
3770s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3771
3c0a92dc
JH
3772/* log 8BITMIME mode announced in MAIL_FROM
3773 0 ... no BODY= used
3774 7 ... 7BIT
3775 8 ... 8BITMIME */
c8e2fc1e
JH
3776if (log_extra_selector & LX_8bitmime)
3777 {
3c0a92dc
JH
3778 sprintf(CS big_buffer, "%d", body_8bitmime);
3779 s = string_append(s, &size, &sptr, 2, US" M8S=", big_buffer);
c8e2fc1e 3780 }
3c0a92dc 3781
059ec3d9
PH
3782/* If an addr-spec in a message-id contains a quoted string, it can contain
3783any characters except " \ and CR and so in particular it can contain NL!
3784Therefore, make sure we use a printing-characters only version for the log.
3785Also, allow for domain literals in the message id. */
3786
3787if (msgid_header != NULL)
3788 {
3789 uschar *old_id;
3790 BOOL save_allow_domain_literals = allow_domain_literals;
3791 allow_domain_literals = TRUE;
3792 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3793 &errmsg, &start, &end, &domain, FALSE);
3794 allow_domain_literals = save_allow_domain_literals;
3795 if (old_id != NULL)
3796 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3797 }
3798
3799/* If subject logging is turned on, create suitable printing-character
3800text. By expanding $h_subject: we make use of the MIME decoding. */
3801
3802if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL)
3803 {
3804 int i;
3805 uschar *p = big_buffer;
3806 uschar *ss = expand_string(US"$h_subject:");
3807
3808 /* Backslash-quote any double quotes or backslashes so as to make a
3809 a C-like string, and turn any non-printers into escape sequences. */
3810
3811 *p++ = '\"';
3812 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3813 {
3814 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3815 *p++ = ss[i];
3816 }
3817 *p++ = '\"';
3818 *p = 0;
3819 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3820 }
3821
3822/* Terminate the string: string_cat() and string_append() leave room, but do
3823not put the zero in. */
3824
3825s[sptr] = 0;
3826
059ec3d9
PH
3827/* Create a message log file if message logs are being used and this message is
3828not blackholed. Write the reception stuff to it. We used to leave message log
e4bdf652 3829creation until the first delivery, but this has proved confusing for some
059ec3d9
PH
3830people. */
3831
3832if (message_logs && blackholed_by == NULL)
3833 {
3834 int fd;
3835
3836 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir,
3837 message_id);
3838 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3839
3840 if (fd < 0 && errno == ENOENT)
3841 {
3842 uschar temp[16];
3843 sprintf(CS temp, "msglog/%s", message_subdir);
3844 if (message_subdir[0] == 0) temp[6] = 0;
3845 (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE);
3846 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3847 }
3848
3849 if (fd < 0)
3850 {
3851 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3852 spool_name, strerror(errno));
3853 }
3854
3855 else
3856 {
3857 FILE *message_log = fdopen(fd, "a");
3858 if (message_log == NULL)
3859 {
3860 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3861 spool_name, strerror(errno));
f1e894f3 3862 (void)close(fd);
059ec3d9
PH
3863 }
3864 else
3865 {
3866 uschar *now = tod_stamp(tod_log);
3867 fprintf(message_log, "%s Received from %s\n", now, s+3);
3868 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3869 frozen_by);
3870 if (queue_only_policy) fprintf(message_log,
3871 "%s no immediate delivery: queued by %s\n", now, queued_by);
f1e894f3 3872 (void)fclose(message_log);
059ec3d9
PH
3873 }
3874 }
3875 }
3876
58eb016e
PH
3877/* Everything has now been done for a successful message except logging its
3878arrival, and outputting an SMTP response. While writing to the log, set a flag
3879to cause a call to receive_bomb_out() if the log cannot be opened. */
3880
3881receive_call_bombout = TRUE;
3882
563b63fa
PH
3883/* Before sending an SMTP response in a TCP/IP session, we check to see if the
3884connection has gone away. This can only be done if there is no unconsumed input
3885waiting in the local input buffer. We can test for this by calling
3886receive_smtp_buffered(). RFC 2920 (pipelining) explicitly allows for additional
3887input to be sent following the final dot, so the presence of following input is
3888not an error.
58eb016e 3889
563b63fa
PH
3890If the connection is still present, but there is no unread input for the
3891socket, the result of a select() call will be zero. If, however, the connection
3892has gone away, or if there is pending input, the result of select() will be
3893non-zero. The two cases can be distinguished by trying to read the next input
3894character. If we succeed, we can unread it so that it remains in the local
3895buffer for handling later. If not, the connection has been lost.
58eb016e 3896
563b63fa
PH
3897Of course, since TCP/IP is asynchronous, there is always a chance that the
3898connection will vanish between the time of this test and the sending of the
3899response, but the chance of this happening should be small. */
3900
3901if (smtp_input && sender_host_address != NULL && !sender_host_notsocket &&
3902 !receive_smtp_buffered())
58eb016e
PH
3903 {
3904 struct timeval tv;
3905 fd_set select_check;
3906 FD_ZERO(&select_check);
3907 FD_SET(fileno(smtp_in), &select_check);
3908 tv.tv_sec = 0;
3909 tv.tv_usec = 0;
3910
563b63fa 3911 if (select(fileno(smtp_in) + 1, &select_check, NULL, NULL, &tv) != 0)
58eb016e 3912 {
80a47a2c
TK
3913 int c = (receive_getc)();
3914 if (c != EOF) (receive_ungetc)(c); else
58eb016e 3915 {
563b63fa
PH
3916 uschar *msg = US"SMTP connection lost after final dot";
3917 smtp_reply = US""; /* No attempt to send a response */
3918 smtp_yield = FALSE; /* Nothing more on this connection */
58eb016e 3919
563b63fa 3920 /* Re-use the log line workspace */
58eb016e 3921
563b63fa
PH
3922 sptr = 0;
3923 s = string_cat(s, &size, &sptr, msg, Ustrlen(msg));
3924 s = add_host_info_for_log(s, &size, &sptr);
3925 s[sptr] = 0;
3926 log_write(0, LOG_MAIN, "%s", s);
58eb016e 3927
563b63fa 3928 /* Delete the files for this aborted message. */
58eb016e 3929
563b63fa
PH
3930 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
3931 message_subdir, message_id);
3932 Uunlink(spool_name);
58eb016e 3933
563b63fa
PH
3934 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
3935 message_subdir, message_id);
3936 Uunlink(spool_name);
58eb016e 3937
563b63fa
PH
3938 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
3939 message_subdir, message_id);
3940 Uunlink(spool_name);
58eb016e 3941
563b63fa
PH
3942 goto TIDYUP;
3943 }
58eb016e
PH
3944 }
3945 }
3946
3947/* The connection has not gone away; we really are going to take responsibility
3948for this message. */
3949
817d9f57 3950/* Cutthrough - had sender last-dot; assume we've sent (or bufferred) all
e4bdf652
JH
3951 data onward by now.
3952
817d9f57 3953 Send dot onward. If accepted, wipe the spooled files, log as delivered and accept
e4bdf652 3954 the sender's dot (below).
817d9f57
JH
3955 If rejected: copy response to sender, wipe the spooled files, log approriately.
3956 If temp-reject: accept to sender, keep the spooled files.
e4bdf652
JH
3957
3958 Having the normal spool files lets us do data-filtering, and store/forward on temp-reject.
817d9f57
JH
3959
3960 XXX We do not handle queue-only, freezing, or blackholes.
e4bdf652
JH
3961*/
3962if(cutthrough_fd >= 0)
3963 {
3964 uschar * msg= cutthrough_finaldot(); /* Ask the target system to accept the messsage */
817d9f57 3965 /* Logging was done in finaldot() */
e4bdf652 3966 switch(msg[0])
817d9f57
JH
3967 {
3968 case '2': /* Accept. Do the same to the source; dump any spoolfiles. */
b784ce7f 3969 cutthrough_done = ACCEPTED;
817d9f57 3970 break; /* message_id needed for SMTP accept below */
61147df4 3971
817d9f57
JH
3972 default: /* Unknown response, or error. Treat as temp-reject. */
3973 case '4': /* Temp-reject. Keep spoolfiles and accept. */
b784ce7f 3974 cutthrough_done = TMP_REJ; /* Avoid the usual immediate delivery attempt */
817d9f57 3975 break; /* message_id needed for SMTP accept below */
61147df4 3976
817d9f57
JH
3977 case '5': /* Perm-reject. Do the same to the source. Dump any spoolfiles */
3978 smtp_reply= msg; /* Pass on the exact error */
b784ce7f 3979 cutthrough_done = PERM_REJ;
817d9f57
JH
3980 break;
3981 }
e4bdf652 3982 }
58eb016e 3983
8ccd00b1
JH
3984#ifndef DISABLE_PRDR
3985if(!smtp_reply || prdr_requested)
3986#else
3987if(!smtp_reply)
fd98a5c6 3988#endif
e4bdf652
JH
3989 {
3990 log_write(0, LOG_MAIN |
3991 (((log_extra_selector & LX_received_recipients) != 0)? LOG_RECIPIENTS : 0) |
3992 (((log_extra_selector & LX_received_sender) != 0)? LOG_SENDER : 0),
3993 "%s", s);
3994
3995 /* Log any control actions taken by an ACL or local_scan(). */
58eb016e 3996
e4bdf652
JH
3997 if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
3998 if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
3999 "no immediate delivery: queued by %s", queued_by);
4000 }
4001receive_call_bombout = FALSE;
58eb016e 4002
059ec3d9
PH
4003store_reset(s); /* The store for the main log message can be reused */
4004
4005/* If the message is frozen, and freeze_tell is set, do the telling. */
4006
4007if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
4008 {
4009 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
4010 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
4011 message_id, frozen_by, sender_address);
4012 }
4013
4014
4015/* Either a message has been successfully received and written to the two spool
4016files, or an error in writing the spool has occurred for an SMTP message, or
58eb016e
PH
4017an SMTP message has been rejected for policy reasons. (For a non-SMTP message
4018we will have already given up because there's no point in carrying on!) In
4019either event, we must now close (and thereby unlock) the data file. In the
059ec3d9
PH
4020successful case, this leaves the message on the spool, ready for delivery. In
4021the error case, the spool file will be deleted. Then tidy up store, interact
4022with an SMTP call if necessary, and return.
4023
4024A fflush() was done earlier in the expectation that any write errors on the
4025data file will be flushed(!) out thereby. Nevertheless, it is theoretically
4026possible for fclose() to fail - but what to do? What has happened to the lock
4027if this happens? */
4028
e4bdf652 4029
059ec3d9 4030TIDYUP:
f1e894f3
PH
4031process_info[process_info_len] = 0; /* Remove message id */
4032if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
059ec3d9
PH
4033
4034/* Now reset signal handlers to their defaults */
4035
4036signal(SIGTERM, SIG_DFL);
4037signal(SIGINT, SIG_DFL);
4038
4039/* Tell an SMTP caller the state of play, and arrange to return the SMTP return
4040value, which defaults TRUE - meaning there may be more incoming messages from
4041this connection. For non-SMTP callers (where there is only ever one message),
4042the default is FALSE. */
4043
4044if (smtp_input)
4045 {
4046 yield = smtp_yield;
4047
4048 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
58eb016e
PH
4049 is set to the response that should be sent. When it is NULL, we generate
4050 default responses. After an ACL error or local_scan() error, the response has
4051 already been sent, and smtp_reply is an empty string to indicate this. */
059ec3d9
PH
4052
4053 if (!smtp_batched_input)
4054 {
4055 if (smtp_reply == NULL)
4056 {
29aba418 4057 if (fake_response != OK)
a5bd321b
PH
4058 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4059 fake_response_text);
4e88a19f
PH
4060
4061 /* An OK response is required; use "message" text if present. */
4062
4063 else if (user_msg != NULL)
4064 {
4065 uschar *code = US"250";
4066 int len = 3;
4067 smtp_message_code(&code, &len, &user_msg, NULL);
4068 smtp_respond(code, len, TRUE, user_msg);
4069 }
4070
4071 /* Default OK response */
4072
8e669ac1
PH
4073 else
4074 smtp_printf("250 OK id=%s\r\n", message_id);
059ec3d9
PH
4075 if (host_checking)
4076 fprintf(stdout,
4077 "\n**** SMTP testing: that is not a real message id!\n\n");
4078 }
4e88a19f 4079
58eb016e 4080 /* smtp_reply is set non-empty */
4e88a19f 4081
8523533c
TK
4082 else if (smtp_reply[0] != 0)
4083 {
29aba418 4084 if (fake_response != OK && (smtp_reply[0] == '2'))
a5bd321b
PH
4085 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4086 fake_response_text);
8e669ac1 4087 else
6951ac6c
PH
4088 smtp_printf("%.1024s\r\n", smtp_reply);
4089 }
e4bdf652 4090
817d9f57
JH
4091 switch (cutthrough_done)
4092 {
b784ce7f
JH
4093 case ACCEPTED: log_write(0, LOG_MAIN, "Completed");/* Delivery was done */
4094 case PERM_REJ: { /* Delete spool files */
817d9f57
JH
4095 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
4096 message_subdir, message_id);
4097 Uunlink(spool_name);
4098 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
4099 message_subdir, message_id);
4100 Uunlink(spool_name);
4101 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
4102 message_subdir, message_id);
4103 Uunlink(spool_name);
4104 }
b784ce7f 4105 case TMP_REJ: message_id[0] = 0; /* Prevent a delivery from starting */
817d9f57 4106 default:break;
e4bdf652 4107 }
817d9f57 4108 cutthrough_delivery = FALSE;
059ec3d9
PH
4109 }
4110
4111 /* For batched SMTP, generate an error message on failure, and do
4112 nothing on success. The function moan_smtp_batch() does not return -
4113 it exits from the program with a non-zero return code. */
4114
4115 else if (smtp_reply != NULL) moan_smtp_batch(NULL, "%s", smtp_reply);
4116 }
4117
4118
4119/* If blackholing, we can immediately log this message's sad fate. The data
4120file has already been unlinked, and the header file was never written to disk.
4121We must now indicate that nothing was received, to prevent a delivery from
4122starting. */
4123
4124if (blackholed_by != NULL)
4125 {
4126 uschar *detail = (local_scan_data != NULL)?
4127 string_printing(local_scan_data) :
4128 string_sprintf("(%s discarded recipients)", blackholed_by);
04f7d5b9 4129 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
059ec3d9
PH
4130 log_write(0, LOG_MAIN, "Completed");
4131 message_id[0] = 0;
4132 }
4133
4134/* Reset headers so that logging of rejects for a subsequent message doesn't
4135include them. It is also important to set header_last = NULL before exiting
4136from this function, as this prevents certain rewrites that might happen during
4137subsequent verifying (of another incoming message) from trying to add headers
4138when they shouldn't. */
4139
4140header_list = header_last = NULL;
4141
4142return yield; /* TRUE if more messages (SMTP only) */
4143}
4144
4145/* End of receive.c */