DMARC documentation and license
[exim.git] / src / src / receive.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
c4ceed07 5/* Copyright (c) University of Cambridge 1995 - 2012 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Code for receiving a message and setting up spool files. */
9
059ec3d9
PH
10#include "exim.h"
11
6a8f9482
TK
12#ifdef EXPERIMENTAL_DCC
13extern int dcc_ok;
14#endif
15
4840604e
TL
16#ifdef EXPERIMENTAL_DMARC
17#include "dmarc.h"
18#endif /* EXPERIMENTAL_DMARC */
19
059ec3d9
PH
20/*************************************************
21* Local static variables *
22*************************************************/
23
24static FILE *data_file = NULL;
25static int data_fd = -1;
26static uschar spool_name[256];
27
28
29
30/*************************************************
31* Non-SMTP character reading functions *
32*************************************************/
33
34/* These are the default functions that are set up in the variables such as
35receive_getc initially. They just call the standard functions, passing stdin as
36the file. (When SMTP input is occurring, different functions are used by
37changing the pointer variables.) */
38
int
stdin_getc(void)
{
/* Fetch the next character (or EOF) from the standard input stream. */
int c = getc(stdin);
return c;
}
44
int
stdin_ungetc(int c)
{
/* Push c back onto the standard input stream; the result is whatever
ungetc() reports. */
int pushed = ungetc(c, stdin);
return pushed;
}
50
int
stdin_feof(void)
{
/* Report the end-of-file indicator of the standard input stream. */
int at_eof = feof(stdin);
return at_eof;
}
56
int
stdin_ferror(void)
{
/* Report the error indicator of the standard input stream. */
int failed = ferror(stdin);
return failed;
}
62
63
64
65
66/*************************************************
67* Check that a set sender is allowed *
68*************************************************/
69
70/* This function is called when a local caller sets an explicit sender address.
71It checks whether this is permitted, which it is for trusted callers.
72Otherwise, it must match the pattern(s) in untrusted_set_sender.
73
74Arguments: the proposed sender address
75Returns: TRUE for a trusted caller
76 TRUE if the address has been set, untrusted_set_sender has been
77 set, and the address matches something in the list
78 FALSE otherwise
79*/
80
81BOOL
82receive_check_set_sender(uschar *newsender)
83{
84uschar *qnewsender;
85if (trusted_caller) return TRUE;
86if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
87qnewsender = (Ustrchr(newsender, '@') != NULL)?
88 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
89return
90 match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1,
91 0, NULL) == OK;
92}
93
94
95
96
/*************************************************
*        Read space info for a partition         *
*************************************************/

/* This function is called by receive_check_fs() below, and also by string
expansion for variables such as $spool_space. The field names for the statvfs
structure are macros, because not all OS have F_FAVAIL and it seems tidier to
have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
have inodes, and they return -1 for the number available.

Later: It turns out that some file systems that do not have the concept of
inodes return 0 rather than -1. Such systems should also return 0 for the total
number of inodes, so we require that to be greater than zero before returning
an inode count.

Arguments:
  isspool       TRUE for spool partition, FALSE for log partition
  inodeptr      address of int to receive inode count; -1 if there isn't one

Returns:        available non-root space, in kilobytes
                -1 for log partition if there isn't one

All values are -1 if the STATFS functions are not available.
*/
121
8e669ac1 122int
5cb8cbc6 123receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
124{
125#ifdef HAVE_STATFS
059ec3d9 126struct STATVFS statbuf;
5cb8cbc6
PH
127uschar *path;
128uschar *name;
129uschar buffer[1024];
059ec3d9 130
5cb8cbc6 131/* The spool directory must always exist. */
059ec3d9 132
5cb8cbc6 133if (isspool)
059ec3d9 134 {
8e669ac1
PH
135 path = spool_directory;
136 name = US"spool";
137 }
138
059ec3d9
PH
139/* Need to cut down the log file path to the directory, and to ignore any
140appearance of "syslog" in it. */
141
5cb8cbc6 142else
059ec3d9 143 {
059ec3d9 144 int sep = ':'; /* Not variable - outside scripts use */
059ec3d9 145 uschar *p = log_file_path;
8e669ac1 146 name = US"log";
059ec3d9
PH
147
148 /* An empty log_file_path means "use the default". This is the same as an
149 empty item in a list. */
150
151 if (*p == 0) p = US":";
152 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL)
153 {
154 if (Ustrcmp(path, "syslog") != 0) break;
155 }
156
5cb8cbc6
PH
157 if (path == NULL) /* No log files */
158 {
8e669ac1
PH
159 *inodeptr = -1;
160 return -1;
161 }
059ec3d9 162
8e669ac1
PH
163 /* An empty string means use the default, which is in the spool directory.
164 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 165 subdirectory has been symbolically linked elsewhere. */
059ec3d9 166
8e669ac1 167 if (path[0] == 0)
059ec3d9 168 {
5cb8cbc6
PH
169 sprintf(CS buffer, CS"%s/log", CS spool_directory);
170 path = buffer;
8e669ac1
PH
171 }
172 else
059ec3d9 173 {
8e669ac1 174 uschar *cp;
5cb8cbc6 175 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 176 }
5cb8cbc6 177 }
8e669ac1 178
8f128379 179/* We now have the path; do the business */
5cb8cbc6
PH
180
181memset(&statbuf, 0, sizeof(statbuf));
182
183if (STATVFS(CS path, &statbuf) != 0)
184 {
185 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
186 "%s directory %s: %s", name, spool_directory, strerror(errno));
187 smtp_closedown(US"spool or log directory problem");
188 exim_exit(EXIT_FAILURE);
189 }
8e669ac1 190
5cb8cbc6
PH
191*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
192
193/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 194
5cb8cbc6
PH
195return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
196
197/* Unable to find partition sizes in this environment. */
198
199#else
200*inodeptr = -1;
201return -1;
202#endif
203}
204
059ec3d9 205
059ec3d9 206
5cb8cbc6
PH
207
208/*************************************************
209* Check space on spool and log partitions *
210*************************************************/
211
212/* This function is called before accepting a message; if any thresholds are
213set, it checks them. If a message_size is supplied, it checks that there is
214enough space for that size plus the threshold - i.e. that the message won't
215reduce the space to the threshold. Not all OS have statvfs(); for those that
216don't, this function always returns TRUE. For some OS the old function and
217struct name statfs is used; that is handled by a macro, defined in exim.h.
218
219Arguments:
220 msg_size the (estimated) size of an incoming message
221
222Returns: FALSE if there isn't enough space, or if the information cannot
223 be obtained
224 TRUE if no check was done or there is enough space
225*/
226
227BOOL
228receive_check_fs(int msg_size)
229{
230int space, inodes;
231
232if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
233 {
8e669ac1
PH
234 space = receive_statvfs(TRUE, &inodes);
235
059ec3d9 236 DEBUG(D_receive)
5cb8cbc6
PH
237 debug_printf("spool directory space = %dK inodes = %d "
238 "check_space = %dK inodes = %d msg_size = %d\n",
239 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
240
241 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 242 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 243 {
5cb8cbc6
PH
244 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
245 "inodes=%d", space, inodes);
059ec3d9
PH
246 return FALSE;
247 }
248 }
249
5cb8cbc6
PH
250if (check_log_space > 0 || check_log_inodes > 0)
251 {
8e669ac1
PH
252 space = receive_statvfs(FALSE, &inodes);
253
5cb8cbc6
PH
254 DEBUG(D_receive)
255 debug_printf("log directory space = %dK inodes = %d "
256 "check_space = %dK inodes = %d\n",
257 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
258
259 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 260 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 261 {
5cb8cbc6
PH
262 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
263 "inodes=%d", space, inodes);
264 return FALSE;
265 }
8e669ac1
PH
266 }
267
059ec3d9
PH
268return TRUE;
269}
270
271
272
273/*************************************************
274* Bomb out while reading a message *
275*************************************************/
276
277/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
278received, or if there is a timeout. A rarer case might be if the log files are
279screwed up and Exim can't open them to record a message's arrival. Handling
280that case is done by setting a flag to cause the log functions to call this
281function if there is an ultimate disaster. That is why it is globally
282accessible.
283
8f128379
PH
284Arguments:
285 reason text reason to pass to the not-quit ACL
286 msg default SMTP response to give if in an SMTP session
059ec3d9
PH
287Returns: it doesn't
288*/
289
290void
8f128379 291receive_bomb_out(uschar *reason, uschar *msg)
059ec3d9 292{
ead37e6c
PP
293 static BOOL already_bombing_out;
294/* The smtp_notquit_exit() below can call ACLs which can trigger recursive
295timeouts, if someone has something slow in their quit ACL. Since the only
296things we should be doing are to close down cleanly ASAP, on the second
297pass we also close down stuff that might be opened again, before bypassing
298the ACL call and exiting. */
299
059ec3d9
PH
300/* If spool_name is set, it contains the name of the data file that is being
301written. Unlink it before closing so that it cannot be picked up by a delivery
302process. Ensure that any header file is also removed. */
303
ead37e6c 304if (spool_name[0] != '\0')
059ec3d9
PH
305 {
306 Uunlink(spool_name);
307 spool_name[Ustrlen(spool_name) - 1] = 'H';
308 Uunlink(spool_name);
ead37e6c 309 spool_name[0] = '\0';
059ec3d9
PH
310 }
311
312/* Now close the file if it is open, either as a fd or a stream. */
313
ead37e6c
PP
314if (data_file != NULL)
315 {
316 (void)fclose(data_file);
317 data_file = NULL;
318} else if (data_fd >= 0) {
319 (void)close(data_fd);
320 data_fd = -1;
321 }
059ec3d9 322
8f128379
PH
323/* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
324smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
325SMTP response. */
059ec3d9 326
ead37e6c 327if (!already_bombing_out)
059ec3d9 328 {
ead37e6c
PP
329 already_bombing_out = TRUE;
330 if (smtp_input)
331 {
332 if (smtp_batched_input)
333 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
334 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
335 smtp_active_hostname, msg);
336 }
059ec3d9
PH
337 }
338
339/* Exit from the program (non-BSMTP cases) */
340
341exim_exit(EXIT_FAILURE);
342}
343
344
345/*************************************************
346* Data read timeout *
347*************************************************/
348
349/* Handler function for timeouts that occur while reading the data that
350comprises a message.
351
352Argument: the signal number
353Returns: nothing
354*/
355
356static void
357data_timeout_handler(int sig)
358{
359uschar *msg = NULL;
360
361sig = sig; /* Keep picky compilers happy */
362
363if (smtp_input)
364 {
365 msg = US"SMTP incoming data timeout";
366 log_write(L_lost_incoming_connection,
367 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
368 "from %s F=<%s>",
369 (sender_fullhost != NULL)? sender_fullhost : US"local process",
370 sender_address);
059ec3d9
PH
371 }
372else
373 {
374 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
375 log_write(L_lost_incoming_connection,
376 LOG_MAIN, "timed out while reading local message");
377 }
378
8f128379 379receive_bomb_out(US"data-timeout", msg); /* Does not return */
059ec3d9
PH
380}
381
382
383
384/*************************************************
385* local_scan() timeout *
386*************************************************/
387
388/* Handler function for timeouts that occur while running a local_scan()
389function.
390
391Argument: the signal number
392Returns: nothing
393*/
394
395static void
396local_scan_timeout_handler(int sig)
397{
398sig = sig; /* Keep picky compilers happy */
399log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
400 "message temporarily rejected (size %d)", message_size);
8f128379
PH
401/* Does not return */
402receive_bomb_out(US"local-scan-timeout", US"local verification problem");
059ec3d9
PH
403}
404
405
406
407/*************************************************
408* local_scan() crashed *
409*************************************************/
410
411/* Handler function for signals that occur while running a local_scan()
412function.
413
414Argument: the signal number
415Returns: nothing
416*/
417
418static void
419local_scan_crash_handler(int sig)
420{
421log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
422 "signal %d - message temporarily rejected (size %d)", sig, message_size);
8f128379
PH
423/* Does not return */
424receive_bomb_out(US"local-scan-error", US"local verification problem");
059ec3d9
PH
425}
426
427
428/*************************************************
429* SIGTERM or SIGINT received *
430*************************************************/
431
432/* Handler for SIGTERM or SIGINT signals that occur while reading the
433data that comprises a message.
434
435Argument: the signal number
436Returns: nothing
437*/
438
439static void
440data_sigterm_sigint_handler(int sig)
441{
442uschar *msg = NULL;
443
444if (smtp_input)
445 {
446 msg = US"Service not available - SIGTERM or SIGINT received";
447 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
448 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
449 }
450else
451 {
f05da2e8 452 if (filter_test == FTEST_NONE)
059ec3d9
PH
453 {
454 fprintf(stderr, "\nexim: %s received - message abandoned\n",
455 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
456 log_write(0, LOG_MAIN, "%s received while reading local message",
457 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
458 }
459 }
460
8f128379 461receive_bomb_out(US"signal-exit", msg); /* Does not return */
059ec3d9
PH
462}
463
464
465
466/*************************************************
467* Add new recipient to list *
468*************************************************/
469
470/* This function builds a list of recipient addresses in argc/argv
471format.
472
473Arguments:
474 recipient the next address to add to recipients_list
475 pno parent number for fixed aliases; -1 otherwise
476
477Returns: nothing
478*/
479
480void
481receive_add_recipient(uschar *recipient, int pno)
482{
483if (recipients_count >= recipients_list_max)
484 {
485 recipient_item *oldlist = recipients_list;
486 int oldmax = recipients_list_max;
487 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
488 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
489 if (oldlist != NULL)
490 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
491 }
492
493recipients_list[recipients_count].address = recipient;
494recipients_list[recipients_count].pno = pno;
8523533c
TK
495#ifdef EXPERIMENTAL_BRIGHTMAIL
496recipients_list[recipients_count].bmi_optin = bmi_current_optin;
497/* reset optin string pointer for next recipient */
498bmi_current_optin = NULL;
499#endif
059ec3d9
PH
500recipients_list[recipients_count++].errors_to = NULL;
501}
502
503
504
505
fd98a5c6
JH
506/*************************************************
507* Send user response message *
508*************************************************/
61147df4 509
fd98a5c6
JH
510/* This function is passed a default response code and a user message. It calls
511smtp_message_code() to check and possibly modify the response code, and then
512calls smtp_respond() to transmit the response. I put this into a function
513just to avoid a lot of repetition.
61147df4
PP
514
515Arguments:
fd98a5c6
JH
516 code the response code
517 user_msg the user message
518
519Returns: nothing
61147df4
PP
520*/
521
#ifdef EXPERIMENTAL_PRDR
static void
smtp_user_msg(uschar *code, uschar *user_msg)
{
/* Length of the response code. It is passed by address, together with the
code and the message, so smtp_message_code() may alter any of them before the
response is sent. */

int codelen = 3;

smtp_message_code(&code, &codelen, &user_msg, NULL);
smtp_respond(code, codelen, TRUE, user_msg);
}
#endif
531
532
533
534
fd98a5c6 535
059ec3d9
PH
536/*************************************************
537* Remove a recipient from the list *
538*************************************************/
539
540/* This function is provided for local_scan() to use.
541
542Argument:
543 recipient address to remove
544
545Returns: TRUE if it did remove something; FALSE otherwise
546*/
547
548BOOL
549receive_remove_recipient(uschar *recipient)
550{
551int count;
552DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
553 recipient);
554for (count = 0; count < recipients_count; count++)
555 {
556 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
557 {
558 if ((--recipients_count - count) > 0)
559 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 560 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
561 return TRUE;
562 }
563 }
564return FALSE;
565}
566
567
568
569
570
/*************************************************
*     Read data portion of a non-SMTP message    *
*************************************************/

/* This function is called to read the remainder of a message (following the
header) when the input is not from SMTP - we are receiving a local message on
a standard input stream. The message is always terminated by EOF, and is also
terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
two cases for maximum efficiency.

Ensure that the body ends with a newline. This will naturally be the case when
the termination is "\n.\n" but may not be otherwise. The RFC defines messages
as "sequences of lines" - this of course strictly applies only to SMTP, but
deliveries into BSD-type mailbox files also require it. Exim used to have a
flag for doing this at delivery time, but as it was always set for all
transports, I decided to simplify things by putting the check here instead.

There is at least one MUA (dtmail) that sends CRLF via this interface, and
other programs are known to do this as well. Exim used to have an option for
dealing with this: in July 2003, after much discussion, the code has been
changed to default to treat any of LF, CRLF, and bare CR as line terminators.

However, for the case when a dot on a line by itself terminates a message, the
only recognized terminating sequences before and after the dot are LF and CRLF.
Otherwise, having read EOL . CR, you don't know whether to read another
character or not.

Internally, in messages stored in Exim's spool files, LF is used as the line
terminator. Under the new regime, bare CRs will no longer appear in these
files.

Arguments:
  fout      a FILE to which to write the message

Returns:    One of the END_xxx values indicating why it stopped reading
*/
607
608static int
609read_message_data(FILE *fout)
610{
611int ch_state;
612register int ch;
d677b2f2 613register int linelength = 0;
059ec3d9
PH
614
615/* Handle the case when only EOF terminates the message */
616
617if (!dot_ends)
618 {
619 register int last_ch = '\n';
620
80a47a2c 621 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
059ec3d9
PH
622 {
623 if (ch == 0) body_zerocount++;
624 if (last_ch == '\r' && ch != '\n')
625 {
d677b2f2
PH
626 if (linelength > max_received_linelength)
627 max_received_linelength = linelength;
628 linelength = 0;
059ec3d9
PH
629 if (fputc('\n', fout) == EOF) return END_WERROR;
630 message_size++;
631 body_linecount++;
632 }
633 if (ch == '\r') continue;
634
635 if (fputc(ch, fout) == EOF) return END_WERROR;
d677b2f2
PH
636 if (ch == '\n')
637 {
638 if (linelength > max_received_linelength)
639 max_received_linelength = linelength;
640 linelength = 0;
641 body_linecount++;
642 }
643 else linelength++;
059ec3d9
PH
644 if (++message_size > thismessage_size_limit) return END_SIZE;
645 }
646
647 if (last_ch != '\n')
648 {
d677b2f2
PH
649 if (linelength > max_received_linelength)
650 max_received_linelength = linelength;
059ec3d9
PH
651 if (fputc('\n', fout) == EOF) return END_WERROR;
652 message_size++;
653 body_linecount++;
654 }
655
656 return END_EOF;
657 }
658
659/* Handle the case when a dot on a line on its own, or EOF, terminates. */
660
661ch_state = 1;
662
80a47a2c 663while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
664 {
665 if (ch == 0) body_zerocount++;
666 switch (ch_state)
667 {
668 case 0: /* Normal state (previous char written) */
669 if (ch == '\n')
d677b2f2
PH
670 {
671 body_linecount++;
672 if (linelength > max_received_linelength)
673 max_received_linelength = linelength;
674 linelength = -1;
675 ch_state = 1;
676 }
059ec3d9
PH
677 else if (ch == '\r')
678 { ch_state = 2; continue; }
679 break;
680
681 case 1: /* After written "\n" */
682 if (ch == '.') { ch_state = 3; continue; }
d677b2f2 683 if (ch != '\n') ch_state = 0; else linelength = -1;
059ec3d9
PH
684 break;
685
686 case 2:
687 body_linecount++; /* After unwritten "\r" */
d677b2f2
PH
688 if (linelength > max_received_linelength)
689 max_received_linelength = linelength;
059ec3d9 690 if (ch == '\n')
d677b2f2
PH
691 {
692 ch_state = 1;
693 linelength = -1;
694 }
059ec3d9
PH
695 else
696 {
697 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
698 if (ch == '\r') continue;
699 ch_state = 0;
d677b2f2 700 linelength = 0;
059ec3d9
PH
701 }
702 break;
703
704 case 3: /* After "\n." (\n written, dot not) */
705 if (ch == '\n') return END_DOT;
706 if (ch == '\r') { ch_state = 4; continue; }
707 message_size++;
d677b2f2 708 linelength++;
059ec3d9
PH
709 if (fputc('.', fout) == EOF) return END_WERROR;
710 ch_state = 0;
711 break;
712
713 case 4: /* After "\n.\r" (\n written, rest not) */
714 if (ch == '\n') return END_DOT;
715 message_size += 2;
716 body_linecount++;
717 if (fputs(".\n", fout) == EOF) return END_WERROR;
718 if (ch == '\r') { ch_state = 2; continue; }
719 ch_state = 0;
720 break;
721 }
722
d677b2f2 723 linelength++;
059ec3d9
PH
724 if (fputc(ch, fout) == EOF) return END_WERROR;
725 if (++message_size > thismessage_size_limit) return END_SIZE;
726 }
727
728/* Get here if EOF read. Unless we have just written "\n", we need to ensure
729the message ends with a newline, and we must also write any characters that
730were saved up while testing for an ending dot. */
731
732if (ch_state != 1)
733 {
734 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
735 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
736 message_size += Ustrlen(ends[ch_state]);
737 body_linecount++;
738 }
739
740return END_EOF;
741}
742
743
744
745
746/*************************************************
747* Read data portion of an SMTP message *
748*************************************************/
749
750/* This function is called to read the remainder of an SMTP message (after the
751headers), or to skip over it when an error has occurred. In this case, the
752output file is passed as NULL.
753
754If any line begins with a dot, that character is skipped. The input should only
755be successfully terminated by CR LF . CR LF unless it is local (non-network)
756SMTP, in which case the CRs are optional, but...
757
758FUDGE: It seems that sites on the net send out messages with just LF
759terminators, despite the warnings in the RFCs, and other MTAs handle this. So
760we make the CRs optional in all cases.
761
762July 2003: Bare CRs cause trouble. We now treat them as line terminators as
763well, so that there are no CRs in spooled messages. However, the message
764terminating dot is not recognized between two bare CRs.
765
766Arguments:
767 fout a FILE to which to write the message; NULL if skipping
768
769Returns: One of the END_xxx values indicating why it stopped reading
770*/
771
772static int
773read_message_data_smtp(FILE *fout)
774{
775int ch_state = 0;
e4bdf652 776int ch;
1f5497b2 777register int linelength = 0;
059ec3d9 778
80a47a2c 779while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
780 {
781 if (ch == 0) body_zerocount++;
782 switch (ch_state)
783 {
784 case 0: /* After LF or CRLF */
785 if (ch == '.')
786 {
787 ch_state = 3;
788 continue; /* Don't ever write . after LF */
789 }
790 ch_state = 1;
791
792 /* Else fall through to handle as normal uschar. */
793
794 case 1: /* Normal state */
795 if (ch == '\n')
796 {
797 ch_state = 0;
798 body_linecount++;
1f5497b2
PH
799 if (linelength > max_received_linelength)
800 max_received_linelength = linelength;
801 linelength = -1;
059ec3d9
PH
802 }
803 else if (ch == '\r')
804 {
805 ch_state = 2;
806 continue;
807 }
808 break;
809
810 case 2: /* After (unwritten) CR */
811 body_linecount++;
1f5497b2
PH
812 if (linelength > max_received_linelength)
813 max_received_linelength = linelength;
814 linelength = -1;
059ec3d9
PH
815 if (ch == '\n')
816 {
817 ch_state = 0;
818 }
819 else
820 {
821 message_size++;
822 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 823 (void) cutthrough_put_nl();
059ec3d9
PH
824 if (ch != '\r') ch_state = 1; else continue;
825 }
826 break;
827
828 case 3: /* After [CR] LF . */
829 if (ch == '\n')
830 return END_DOT;
831 if (ch == '\r')
832 {
833 ch_state = 4;
834 continue;
835 }
836 ch_state = 1; /* The dot itself is removed */
837 break;
838
839 case 4: /* After [CR] LF . CR */
840 if (ch == '\n') return END_DOT;
841 message_size++;
842 body_linecount++;
843 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 844 (void) cutthrough_put_nl();
059ec3d9
PH
845 if (ch == '\r')
846 {
847 ch_state = 2;
848 continue;
849 }
850 ch_state = 1;
851 break;
852 }
853
854 /* Add the character to the spool file, unless skipping; then loop for the
855 next. */
856
857 message_size++;
1f5497b2 858 linelength++;
059ec3d9
PH
859 if (fout != NULL)
860 {
861 if (fputc(ch, fout) == EOF) return END_WERROR;
862 if (message_size > thismessage_size_limit) return END_SIZE;
863 }
e4bdf652
JH
864 if(ch == '\n')
865 (void) cutthrough_put_nl();
866 else
867 {
868 uschar c= ch;
869 (void) cutthrough_puts(&c, 1);
870 }
059ec3d9
PH
871 }
872
873/* Fall through here if EOF encountered. This indicates some kind of error,
874since a correct message is terminated by [CR] LF . [CR] LF. */
875
876return END_EOF;
877}
878
879
880
881
/*************************************************
*             Swallow SMTP message               *
*************************************************/

/* This function is called when there has been some kind of error while reading
an SMTP message, and the remaining data may need to be swallowed. It is global
because it is called from smtp_closedown() to shut down an incoming call
tidily.

Arguments:  none
Returns:    nothing
*/
894
895void
896receive_swallow_smtp(void)
897{
898if (message_ended >= END_NOTENDED)
899 message_ended = read_message_data_smtp(NULL);
900}
901
902
903
904/*************************************************
905* Handle lost SMTP connection *
906*************************************************/
907
908/* This function logs connection loss incidents and generates an appropriate
909SMTP response.
910
911Argument: additional data for the message
912Returns: the SMTP response
913*/
914
915static uschar *
916handle_lost_connection(uschar *s)
917{
918log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
919 "%s lost while reading message data%s", smtp_get_connection_info(), s);
920return US"421 Lost incoming connection";
921}
922
923
924
925
/*************************************************
*      Handle a non-smtp reception error         *
*************************************************/

/* This function is called for various errors during the reception of non-SMTP
messages. It either sends a message to the sender of the problem message, or it
writes to the standard error stream.

Arguments:
  errcode     code for moan_to_sender(), identifying the error
  text1       first message text, passed to moan_to_sender()
  text2       second message text, used only for stderr
  error_rc    code to pass to exim_exit if no problem
  f           FILE containing body of message (may be stdin)
  hptr        pointer to instore headers or NULL

Returns:      calls exim_exit(), which does not return
*/
944
945static void
946give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
947 FILE *f, header_line *hptr)
948{
949if (error_handling == ERRORS_SENDER)
950 {
951 error_block eblock;
952 eblock.next = NULL;
953 eblock.text1 = text1;
954 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
955 error_rc = EXIT_FAILURE;
956 }
957else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 958(void)fclose(f);
059ec3d9
PH
959exim_exit(error_rc);
960}
961
962
963
964/*************************************************
965* Add header lines set up by ACL *
966*************************************************/
967
850635b6
PH
968/* This function is called to add the header lines that were set up by
969statements in an ACL to the list of headers in memory. It is done in two stages
970like this, because when the ACL for RCPT is running, the other headers have not
971yet been received. This function is called twice; once just before running the
972DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
973are visible to the DATA ACL.
059ec3d9
PH
974
975Originally these header lines were added at the end. Now there is support for
976three different places: top, bottom, and after the Received: header(s). There
977will always be at least one Received: header, even if it is marked deleted, and
978even if something else has been put in front of it.
979
980Arguments:
981 acl_name text to identify which ACL
982
983Returns: nothing
984*/
985
986static void
987add_acl_headers(uschar *acl_name)
988{
989header_line *h, *next;
990header_line *last_received = NULL;
e7568d51
TL
991
992if (acl_removed_headers != NULL)
993 {
994 DEBUG(D_receive|D_acl) debug_printf(">>Headers removed by %s ACL:\n", acl_name);
995
996 for (h = header_list; h != NULL; h = h->next)
997 {
e7568d51
TL
998 uschar *list;
999 BOOL include_header;
1000
1001 if (h->type == htype_old) continue;
1002
1003 include_header = TRUE;
1004 list = acl_removed_headers;
1005
1006 int sep = ':'; /* This is specified as a colon-separated list */
1007 uschar *s;
1008 uschar buffer[128];
1009 while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer)))
1010 != NULL)
1011 {
1012 int len = Ustrlen(s);
1013 if (header_testname(h, s, len, FALSE))
1014 {
1015 h->type = htype_old;
1016 DEBUG(D_receive|D_acl) debug_printf(" %s", h->text);
1017 }
1018 }
1019 }
1020 acl_removed_headers = NULL;
1021 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1022 }
059ec3d9 1023
71fafd95 1024if (acl_added_headers == NULL) return;
059ec3d9
PH
1025DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
1026
71fafd95 1027for (h = acl_added_headers; h != NULL; h = next)
059ec3d9
PH
1028 {
1029 next = h->next;
1030
1031 switch(h->type)
1032 {
1033 case htype_add_top:
1034 h->next = header_list;
1035 header_list = h;
1036 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
1037 break;
1038
1039 case htype_add_rec:
1040 if (last_received == NULL)
1041 {
1042 last_received = header_list;
1043 while (!header_testname(last_received, US"Received", 8, FALSE))
1044 last_received = last_received->next;
1045 while (last_received->next != NULL &&
1046 header_testname(last_received->next, US"Received", 8, FALSE))
1047 last_received = last_received->next;
1048 }
1049 h->next = last_received->next;
1050 last_received->next = h;
1051 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
1052 break;
1053
8523533c
TK
1054 case htype_add_rfc:
1055 /* add header before any header which is NOT Received: or Resent- */
1056 last_received = header_list;
1057 while ( (last_received->next != NULL) &&
1058 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
1059 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
1060 last_received = last_received->next;
1061 /* last_received now points to the last Received: or Resent-* header
1062 in an uninterrupted chain of those header types (seen from the beginning
1063 of all headers. Our current header must follow it. */
1064 h->next = last_received->next;
1065 last_received->next = h;
8e669ac1 1066 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
1067 break;
1068
059ec3d9
PH
1069 default:
1070 h->next = NULL;
1071 header_last->next = h;
1072 break;
1073 }
1074
1075 if (h->next == NULL) header_last = h;
1076
1077 /* Check for one of the known header types (From:, To:, etc.) though in
1078 practice most added headers are going to be "other". Lower case
1079 identification letters are never stored with the header; they are used
1080 for existence tests when messages are received. So discard any lower case
1081 flag values. */
1082
1083 h->type = header_checkname(h, FALSE);
1084 if (h->type >= 'a') h->type = htype_other;
1085
1086 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1087 }
1088
71fafd95 1089acl_added_headers = NULL;
059ec3d9
PH
1090DEBUG(D_receive|D_acl) debug_printf(">>\n");
1091}
1092
1093
1094
1095/*************************************************
1096* Add host information for log line *
1097*************************************************/
1098
1099/* Called for acceptance and rejecting log lines. This adds information about
1100the calling host to a string that is being built dynamically.
1101
1102Arguments:
1103 s the dynamic string
1104 sizeptr points to the size variable
1105 ptrptr points to the pointer variable
1106
1107Returns: the extended string
1108*/
1109
1110static uschar *
1111add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr)
1112{
1113if (sender_fullhost != NULL)
1114 {
1115 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
1116 if ((log_extra_selector & LX_incoming_interface) != 0 &&
1117 interface_address != NULL)
1118 {
1119 uschar *ss = string_sprintf(" I=[%s]:%d", interface_address,
1120 interface_port);
1121 s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss));
1122 }
1123 }
1124if (sender_ident != NULL)
1125 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1126if (received_protocol != NULL)
1127 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1128return s;
1129}
1130
1131
1132
63955bf2 1133#ifdef WITH_CONTENT_SCAN
059ec3d9 1134
54cdb463
PH
1135/*************************************************
1136* Run the MIME ACL on a message *
1137*************************************************/
1138
1139/* This code is in a subroutine so that it can be used for both SMTP
1140and non-SMTP messages. It is called with a non-NULL ACL pointer.
1141
1142Arguments:
1143 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1144 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1145 smtp_reply_ptr Where SMTP reply is being built
1146 blackholed_by_ptr Where "blackholed by" message is being built
1147
1148Returns: TRUE to carry on; FALSE to abandon the message
1149*/
1150
1151static BOOL
1152run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1153 uschar **blackholed_by_ptr)
1154{
1155FILE *mbox_file;
1156uschar rfc822_file_path[2048];
1157unsigned long mbox_size;
1158header_line *my_headerlist;
1159uschar *user_msg, *log_msg;
1160int mime_part_count_buffer = -1;
7156b1ef 1161int rc = OK;
54cdb463
PH
1162
1163memset(CS rfc822_file_path,0,2048);
1164
1165/* check if it is a MIME message */
1166my_headerlist = header_list;
4e88a19f
PH
1167while (my_headerlist != NULL)
1168 {
54cdb463 1169 /* skip deleted headers */
4e88a19f
PH
1170 if (my_headerlist->type == '*')
1171 {
54cdb463
PH
1172 my_headerlist = my_headerlist->next;
1173 continue;
4e88a19f
PH
1174 }
1175 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1176 {
54cdb463
PH
1177 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1178 goto DO_MIME_ACL;
4e88a19f 1179 }
54cdb463 1180 my_headerlist = my_headerlist->next;
4e88a19f 1181 }
54cdb463
PH
1182
1183DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1184return TRUE;
1185
1186DO_MIME_ACL:
1187/* make sure the eml mbox file is spooled up */
8544e77a 1188mbox_file = spool_mbox(&mbox_size, NULL);
54cdb463
PH
1189if (mbox_file == NULL) {
1190 /* error while spooling */
1191 log_write(0, LOG_MAIN|LOG_PANIC,
1192 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1193 Uunlink(spool_name);
1194 unspool_mbox();
6f0c431a
PP
1195#ifdef EXPERIMENTAL_DCC
1196 dcc_ok = 0;
1197#endif
a5bd321b 1198 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
54cdb463
PH
1199 message_id[0] = 0; /* Indicate no message accepted */
1200 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1201 return FALSE; /* Indicate skip to end of receive function */
1202};
1203
1204mime_is_rfc822 = 0;
1205
1206MIME_ACL_CHECK:
1207mime_part_count = -1;
1208rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1209(void)fclose(mbox_file);
54cdb463 1210
4e88a19f
PH
1211if (Ustrlen(rfc822_file_path) > 0)
1212 {
54cdb463
PH
1213 mime_part_count = mime_part_count_buffer;
1214
4e88a19f
PH
1215 if (unlink(CS rfc822_file_path) == -1)
1216 {
54cdb463
PH
1217 log_write(0, LOG_PANIC,
1218 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1219 goto END_MIME_ACL;
4e88a19f
PH
1220 }
1221 }
54cdb463
PH
1222
1223/* check if we must check any message/rfc822 attachments */
4e88a19f
PH
1224if (rc == OK)
1225 {
54cdb463
PH
1226 uschar temp_path[1024];
1227 int n;
1228 struct dirent *entry;
1229 DIR *tempdir;
1230
b07e6aa3
PH
1231 (void)string_format(temp_path, 1024, "%s/scan/%s", spool_directory,
1232 message_id);
54cdb463 1233
4e88a19f
PH
1234 tempdir = opendir(CS temp_path);
1235 n = 0;
1236 do
1237 {
1238 entry = readdir(tempdir);
1239 if (entry == NULL) break;
1240 if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0)
1241 {
b07e6aa3 1242 (void)string_format(rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
4e88a19f
PH
1243 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path);
1244 break;
1245 }
1246 } while (1);
1247 closedir(tempdir);
54cdb463 1248
4e88a19f
PH
1249 if (entry != NULL)
1250 {
c58b88df 1251 mbox_file = Ufopen(rfc822_file_path,"rb");
4e88a19f
PH
1252 if (mbox_file == NULL)
1253 {
54cdb463
PH
1254 log_write(0, LOG_PANIC,
1255 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1256 unlink(CS rfc822_file_path);
1257 goto END_MIME_ACL;
4e88a19f 1258 }
54cdb463
PH
1259 /* set RFC822 expansion variable */
1260 mime_is_rfc822 = 1;
1261 mime_part_count_buffer = mime_part_count;
1262 goto MIME_ACL_CHECK;
4e88a19f
PH
1263 }
1264 }
54cdb463
PH
1265
1266END_MIME_ACL:
1267add_acl_headers(US"MIME");
1268if (rc == DISCARD)
1269 {
1270 recipients_count = 0;
1271 *blackholed_by_ptr = US"MIME ACL";
1272 }
1273else if (rc != OK)
1274 {
1275 Uunlink(spool_name);
1276 unspool_mbox();
6f0c431a
PP
1277#ifdef EXPERIMENTAL_DCC
1278 dcc_ok = 0;
1279#endif
54cdb463
PH
1280 if (smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1281 *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */
1282 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1283 message_id[0] = 0; /* Indicate no message accepted */
1284 return FALSE; /* Cause skip to end of receive function */
4e88a19f 1285 }
54cdb463
PH
1286
1287return TRUE;
1288}
1289
63955bf2 1290#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1291
1292
e4bdf652
JH
1293
1294void
1295received_header_gen(void)
1296{
1297uschar *received;
1298uschar *timestamp;
1299header_line *received_header= header_list;
1300
1301timestamp = expand_string(US"${tod_full}");
1302if (recipients_count == 1) received_for = recipients_list[0].address;
1303received = expand_string(received_header_text);
1304received_for = NULL;
1305
1306if (received == NULL)
1307 {
1308 if(spool_name[0] != 0)
1309 Uunlink(spool_name); /* Lose the data file */
1310 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1311 "(received_header_text) failed: %s", string_printing(received_header_text),
1312 expand_string_message);
1313 }
1314
1315/* The first element on the header chain is reserved for the Received header,
1316so all we have to do is fill in the text pointer, and set the type. However, if
1317the result of the expansion is an empty string, we leave the header marked as
1318"old" so as to refrain from adding a Received header. */
1319
1320if (received[0] == 0)
1321 {
1322 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1323 received_header->type = htype_old;
1324 }
1325else
1326 {
1327 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1328 received_header->type = htype_received;
1329 }
1330
1331received_header->slen = Ustrlen(received_header->text);
1332
1333DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1334 received_header->type, received_header->text);
1335}
1336
1337
1338
059ec3d9
PH
1339/*************************************************
1340* Receive message *
1341*************************************************/
1342
1343/* Receive a message on the given input, and put it into a pair of spool files.
1344Either a non-null list of recipients, or the extract flag will be true, or
1345both. The flag sender_local is true for locally generated messages. The flag
1346submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a 1347suppress_local_fixups is true if an ACL has obeyed "control =
f4ee74ac
PP
1348suppress_local_fixups" or -G was passed on the command-line.
1349The flag smtp_input is true if the message is to be
8800895a
PH
1350handled using SMTP conventions about termination and lines starting with dots.
1351For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1352
1353If a message was successfully read, message_id[0] will be non-zero.
1354
1355The general actions of this function are:
1356
1357 . Read the headers of the message (if any) into a chain of store
1358 blocks.
1359
1360 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1361 throw it away, unless the caller is trusted, or unless
1362 active_local_sender_retain is set - which can only happen if
1363 active_local_from_check is false.
059ec3d9
PH
1364
1365 . If recipients are to be extracted from the message, build the
1366 recipients list from the headers, removing any that were on the
1367 original recipients list (unless extract_addresses_remove_arguments is
1368 false), and at the same time, remove any bcc header that may be present.
1369
1370 . Get the spool file for the data, sort out its unique name, open
1371 and lock it (but don't give it the name yet).
1372
1373 . Generate a "Message-Id" header if the message doesn't have one, for
1374 locally-originated messages.
1375
1376 . Generate a "Received" header.
1377
1378 . Ensure the recipients list is fully qualified and rewritten if necessary.
1379
1380 . If there are any rewriting rules, apply them to the sender address
1381 and also to the headers.
1382
1383 . If there is no from: header, generate one, for locally-generated messages
1384 and messages in "submission mode" only.
1385
1386 . If the sender is local, check that from: is correct, and if not, generate
1387 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1388 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1389
1390 . If there is no "date" header, generate one, for locally-originated
1391 or submission mode messages only.
1392
1393 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1394 dot_ends mode, to the data file. Leave it open, to hold the lock.
1395
1396 . Write the envelope and the headers to a new file.
1397
1398 . Set the name for the header file; close it.
1399
1400 . Set the name for the data file; close it.
1401
1402Because this function can potentially be called many times in a single
1403SMTP connection, all store should be got by store_get(), so that it will be
1404automatically retrieved after the message is accepted.
1405
1406FUDGE: It seems that sites on the net send out messages with just LF
1407terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1408we make the CRs optional in all cases.
1409
1410July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1411new regime is now in place in which bare CRs in header lines are turned into LF
1412followed by a space, so as not to terminate the header line.
1413
1414February 2004: A bare LF in a header line in a message whose first line was
1415terminated by CRLF is treated in the same way as a bare CR.
1416
1417Arguments:
1418 extract_recip TRUE if recipients are to be extracted from the message's
1419 headers
1420
1421Returns: TRUE there are more messages to be read (SMTP input)
1422 FALSE there are no more messages to be read (non-SMTP input
1423 or SMTP connection collapsed, or other failure)
1424
1425When reading a message for filter testing, the returned value indicates
1426whether the headers (which is all that is read) were terminated by '.' or
1427not. */
1428
1429BOOL
1430receive_msg(BOOL extract_recip)
1431{
7156b1ef
NM
1432int i;
1433int rc = FAIL;
059ec3d9
PH
1434int msg_size = 0;
1435int process_info_len = Ustrlen(process_info);
1436int error_rc = (error_handling == ERRORS_SENDER)?
1437 errors_sender_rc : EXIT_FAILURE;
1438int header_size = 256;
1439int start, end, domain, size, sptr;
1440int id_resolution;
1441int had_zero = 0;
d677b2f2 1442int prevlines_length = 0;
059ec3d9
PH
1443
1444register int ptr = 0;
1445
1446BOOL contains_resent_headers = FALSE;
1447BOOL extracted_ignored = FALSE;
1448BOOL first_line_ended_crlf = TRUE_UNSET;
1449BOOL smtp_yield = TRUE;
1450BOOL yield = FALSE;
1451
1452BOOL resents_exist = FALSE;
1453uschar *resent_prefix = US"";
1454uschar *blackholed_by = NULL;
04f7d5b9 1455uschar *blackhole_log_msg = US"";
4ea50c5f 1456int cutthrough_done = 0;
059ec3d9
PH
1457
1458flock_t lock_data;
1459error_block *bad_addresses = NULL;
1460
1461uschar *frozen_by = NULL;
1462uschar *queued_by = NULL;
1463
1464uschar *errmsg, *s;
1465struct stat statbuf;
1466
4e88a19f 1467/* Final message to give to SMTP caller, and messages from ACLs */
059ec3d9
PH
1468
1469uschar *smtp_reply = NULL;
4e88a19f 1470uschar *user_msg, *log_msg;
059ec3d9
PH
1471
1472/* Working header pointers */
1473
1474header_line *h, *next;
1475
2cbb4081 1476/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1477
1478BOOL date_header_exists = FALSE;
1479
1480/* Pointers to receive the addresses of headers whose contents we need. */
1481
1482header_line *from_header = NULL;
1483header_line *subject_header = NULL;
1484header_line *msgid_header = NULL;
1485header_line *received_header;
1486
4840604e
TL
1487#ifdef EXPERIMENTAL_DMARC
1488int dmarc_up = 0;
1489#endif /* EXPERIMENTAL_DMARC */
1490
059ec3d9
PH
1491/* Variables for use when building the Received: header. */
1492
059ec3d9
PH
1493uschar *timestamp;
1494int tslen;
1495
1496/* Release any open files that might have been cached while preparing to
1497accept the message - e.g. by verifying addresses - because reading a message
1498might take a fair bit of real time. */
1499
1500search_tidyup();
1501
e4bdf652
JH
1502/* Extracting the recipient list from an input file is incompatible with
1503cutthrough delivery with the no-spool option. It shouldn't be possible
817d9f57 1504to set up the combination, but just in case kill any ongoing connection. */
e4bdf652 1505if (extract_recip || !smtp_input)
2e5b33cd 1506 cancel_cutthrough_connection("not smtp input");
e4bdf652 1507
059ec3d9
PH
1508/* Initialize the chain of headers by setting up a place-holder for Received:
1509header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1510pointing to the end of the chain to make adding headers simple. */
1511
1512received_header = header_list = header_last = store_get(sizeof(header_line));
1513header_list->next = NULL;
1514header_list->type = htype_old;
1515header_list->text = NULL;
1516header_list->slen = 0;
1517
1518/* Control block for the next header to be read. */
1519
1520next = store_get(sizeof(header_line));
1521next->text = store_get(header_size);
1522
1523/* Initialize message id to be null (indicating no message read), and the
1524header names list to be the normal list. Indicate there is no data file open
1525yet, initialize the size and warning count, and deal with no size limit. */
1526
1527message_id[0] = 0;
1528data_file = NULL;
1529data_fd = -1;
1530spool_name[0] = 0;
1531message_size = 0;
1532warning_count = 0;
d677b2f2 1533received_count = 1; /* For the one we will add */
059ec3d9
PH
1534
1535if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1536
2e0c1448 1537/* While reading the message, the following counts are computed. */
059ec3d9 1538
d677b2f2
PH
1539message_linecount = body_linecount = body_zerocount =
1540 max_received_linelength = 0;
059ec3d9 1541
80a47a2c
TK
1542#ifndef DISABLE_DKIM
1543/* Call into DKIM to set up the context. */
1544if (smtp_input && !smtp_batched_input && !dkim_disable_verify) dkim_exim_verify_init();
fb2274d4
TK
1545#endif
1546
4840604e
TL
1547#ifdef EXPERIMENTAL_DMARC
1548/* initialize libopendmarc */
1549dmarc_up = dmarc_init();
1550#endif
1551
059ec3d9
PH
1552/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1553ids, and fractions of a second are required. See the comments that precede the
1554message id creation below. */
1555
1556(void)gettimeofday(&message_id_tv, NULL);
1557
1558/* For other uses of the received time we can operate with granularity of one
1559second, and for that we use the global variable received_time. This is for
1560things like ultimate message timeouts. */
1561
1562received_time = message_id_tv.tv_sec;
1563
1564/* If SMTP input, set the special handler for timeouts. The alarm() calls
1565happen in the smtp_getc() function when it refills its buffer. */
1566
1567if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1568
1569/* If not SMTP input, timeout happens only if configured, and we just set a
1570single timeout for the whole message. */
1571
1572else if (receive_timeout > 0)
1573 {
1574 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1575 alarm(receive_timeout);
1576 }
1577
1578/* SIGTERM and SIGINT are caught always. */
1579
1580signal(SIGTERM, data_sigterm_sigint_handler);
1581signal(SIGINT, data_sigterm_sigint_handler);
1582
1583/* Header lines in messages are not supposed to be very long, though when
1584unfolded, to: and cc: headers can take up a lot of store. We must also cope
1585with the possibility of junk being thrown at us. Start by getting 256 bytes for
1586storing the header, and extend this as necessary using string_cat().
1587
1588To cope with total lunacies, impose an upper limit on the length of the header
1589section of the message, as otherwise the store will fill up. We must also cope
1590with the possibility of binary zeros in the data. Hence we cannot use fgets().
1591Folded header lines are joined into one string, leaving the '\n' characters
1592inside them, so that writing them out reproduces the input.
1593
1594Loop for each character of each header; the next structure for chaining the
1595header is set up already, with ptr the offset of the next character in
1596next->text. */
1597
1598for (;;)
1599 {
80a47a2c 1600 int ch = (receive_getc)();
059ec3d9
PH
1601
1602 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1603 SMTP must have a correct "." terminator. */
1604
1605 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1606 {
1607 smtp_reply = handle_lost_connection(US" (header)");
1608 smtp_yield = FALSE;
1609 goto TIDYUP; /* Skip to end of function */
1610 }
1611
1612 /* See if we are at the current header's size limit - there must be at least
1613 four bytes left. This allows for the new character plus a zero, plus two for
1614 extra insertions when we are playing games with dots and carriage returns. If
1615 we are at the limit, extend the text buffer. This could have been done
1616 automatically using string_cat() but because this is a tightish loop storing
1617 only one character at a time, we choose to do it inline. Normally
1618 store_extend() will be able to extend the block; only at the end of a big
1619 store block will a copy be needed. To handle the case of very long headers
1620 (and sometimes lunatic messages can have ones that are 100s of K long) we
1621 call store_release() for strings that have been copied - if the string is at
1622 the start of a block (and therefore the only thing in it, because we aren't
1623 doing any other gets), the block gets freed. We can only do this because we
1624 know there are no other calls to store_get() going on. */
1625
1626 if (ptr >= header_size - 4)
1627 {
1628 int oldsize = header_size;
1629 /* header_size += 256; */
1630 header_size *= 2;
1631 if (!store_extend(next->text, oldsize, header_size))
1632 {
1633 uschar *newtext = store_get(header_size);
1634 memcpy(newtext, next->text, ptr);
1635 store_release(next->text);
1636 next->text = newtext;
1637 }
1638 }
1639
1640 /* Cope with receiving a binary zero. There is dispute about whether
1641 these should be allowed in RFC 822 messages. The middle view is that they
1642 should not be allowed in headers, at least. Exim takes this attitude at
1643 the moment. We can't just stomp on them here, because we don't know that
1644 this line is a header yet. Set a flag to cause scanning later. */
1645
1646 if (ch == 0) had_zero++;
1647
1648 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1649 those from data files use just LF. Treat LF in local SMTP input as a
1650 terminator too. Treat EOF as a line terminator always. */
1651
1652 if (ch == EOF) goto EOL;
1653
1654 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1655 other MTAs accept this. We are therefore forced into this "liberalisation"
1656 too, so we accept LF as a line terminator whatever the source of the message.
1657 However, if the first line of the message ended with a CRLF, we treat a bare
1658 LF specially by inserting a white space after it to ensure that the header
1659 line is not terminated. */
1660
1661 if (ch == '\n')
1662 {
1663 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
80a47a2c 1664 else if (first_line_ended_crlf) receive_ungetc(' ');
059ec3d9
PH
1665 goto EOL;
1666 }
1667
1668 /* This is not the end of the line. If this is SMTP input and this is
1669 the first character in the line and it is a "." character, ignore it.
1670 This implements the dot-doubling rule, though header lines starting with
1671 dots aren't exactly common. They are legal in RFC 822, though. If the
1672 following is CRLF or LF, this is the line that terminates the
1673 entire message. We set message_ended to indicate this has happened (to
1674 prevent further reading), and break out of the loop, having freed the
1675 empty header, and set next = NULL to indicate no data line. */
1676
1677 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1678 {
80a47a2c 1679 ch = (receive_getc)();
059ec3d9
PH
1680 if (ch == '\r')
1681 {
80a47a2c 1682 ch = (receive_getc)();
059ec3d9
PH
1683 if (ch != '\n')
1684 {
80a47a2c 1685 receive_ungetc(ch);
059ec3d9
PH
1686 ch = '\r'; /* Revert to CR */
1687 }
1688 }
1689 if (ch == '\n')
1690 {
1691 message_ended = END_DOT;
1692 store_reset(next);
1693 next = NULL;
1694 break; /* End character-reading loop */
1695 }
1696
1697 /* For non-SMTP input, the dot at the start of the line was really a data
1698 character. What is now in ch is the following character. We guaranteed
1699 enough space for this above. */
1700
1701 if (!smtp_input)
1702 {
1703 next->text[ptr++] = '.';
1704 message_size++;
1705 }
1706 }
1707
1708 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1709 remember this case if this is the first line ending. */
1710
1711 if (ch == '\r')
1712 {
80a47a2c 1713 ch = (receive_getc)();
059ec3d9
PH
1714 if (ch == '\n')
1715 {
1716 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1717 goto EOL;
1718 }
1719
1720 /* Otherwise, put back the character after CR, and turn the bare CR
1721 into LF SP. */
1722
80a47a2c 1723 ch = (receive_ungetc)(ch);
059ec3d9
PH
1724 next->text[ptr++] = '\n';
1725 message_size++;
1726 ch = ' ';
1727 }
1728
1729 /* We have a data character for the header line. */
1730
1731 next->text[ptr++] = ch; /* Add to buffer */
1732 message_size++; /* Total message size so far */
1733
1734 /* Handle failure due to a humungously long header section. The >= allows
1735 for the terminating \n. Add what we have so far onto the headers list so
1736 that it gets reflected in any error message, and back up the just-read
1737 character. */
1738
1739 if (message_size >= header_maxsize)
1740 {
1741 next->text[ptr] = 0;
1742 next->slen = ptr;
1743 next->type = htype_other;
1744 next->next = NULL;
1745 header_last->next = next;
1746 header_last = next;
1747
1748 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1749 "%s (more than %d characters): message abandoned",
1750 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1751
1752 if (smtp_input)
1753 {
1754 smtp_reply = US"552 Message header is ridiculously long";
1755 receive_swallow_smtp();
1756 goto TIDYUP; /* Skip to end of function */
1757 }
1758
1759 else
1760 {
1761 give_local_error(ERRMESS_VLONGHEADER,
1762 string_sprintf("message header longer than %d characters received: "
1763 "message not accepted", header_maxsize), US"", error_rc, stdin,
1764 header_list->next);
1765 /* Does not return */
1766 }
1767 }
1768
1769 continue; /* With next input character */
1770
1771 /* End of header line reached */
1772
1773 EOL:
2e0c1448
PH
1774
1775 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1776
1777 receive_linecount++;
1778 message_linecount++;
059ec3d9 1779
d677b2f2
PH
1780 /* Keep track of maximum line length */
1781
1782 if (ptr - prevlines_length > max_received_linelength)
1783 max_received_linelength = ptr - prevlines_length;
1784 prevlines_length = ptr + 1;
1785
059ec3d9
PH
1786 /* Now put in the terminating newline. There is always space for
1787 at least two more characters. */
1788
1789 next->text[ptr++] = '\n';
1790 message_size++;
1791
1792 /* A blank line signals the end of the headers; release the unwanted
1793 space and set next to NULL to indicate this. */
1794
1795 if (ptr == 1)
1796 {
1797 store_reset(next);
1798 next = NULL;
1799 break;
1800 }
1801
1802 /* There is data in the line; see if the next input character is a
1803 whitespace character. If it is, we have a continuation of this header line.
1804 There is always space for at least one character at this point. */
1805
1806 if (ch != EOF)
1807 {
80a47a2c 1808 int nextch = (receive_getc)();
059ec3d9
PH
1809 if (nextch == ' ' || nextch == '\t')
1810 {
1811 next->text[ptr++] = nextch;
1812 message_size++;
1813 continue; /* Iterate the loop */
1814 }
80a47a2c 1815 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
059ec3d9
PH
1816 else ch = EOF; /* Cause main loop to exit at end */
1817 }
1818
1819 /* We have got to the real line end. Terminate the string and release store
1820 beyond it. If it turns out to be a real header, internal binary zeros will
1821 be squashed later. */
1822
1823 next->text[ptr] = 0;
1824 next->slen = ptr;
1825 store_reset(next->text + ptr + 1);
1826
1827 /* Check the running total size against the overall message size limit. We
1828 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1829 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1830 headers - the code to read the body will then also hit the buffer. */
1831
1832 if (message_size > thismessage_size_limit) break;
1833
1834 /* A line that is not syntactically correct for a header also marks
1835 the end of the headers. In this case, we leave next containing the
1836 first data line. This might actually be several lines because of the
1837 continuation logic applied above, but that doesn't matter.
1838
1839 It turns out that smail, and presumably sendmail, accept leading lines
1840 of the form
1841
1842 From ph10 Fri Jan 5 12:35 GMT 1996
1843
1844 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1845 find any documentation of this, but for compatibility it had better be
1846 accepted. Exim restricts it to the case of non-smtp messages, and
1847 treats it as an alternative to the -f command line option. Thus it is
1848 ignored except for trusted users or filter testing. Otherwise it is taken
1849 as the sender address, unless -f was used (sendmail compatibility).
1850
1851 It further turns out that some UUCPs generate the From_line in a different
1852 format, e.g.
1853
1854 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1855
1856 The regex for matching these things is now capable of recognizing both
1857 formats (including 2- and 4-digit years in the latter). In fact, the regex
1858 is now configurable, as is the expansion string to fish out the sender.
1859
1860 Even further on it has been discovered that some broken clients send
1861 these lines in SMTP messages. There is now an option to ignore them from
1862 specified hosts or networks. Sigh. */
1863
1864 if (header_last == header_list &&
1865 (!smtp_input
1866 ||
1867 (sender_host_address != NULL &&
1868 verify_check_host(&ignore_fromline_hosts) == OK)
1869 ||
1870 (sender_host_address == NULL && ignore_fromline_local)
1871 ) &&
1872 regex_match_and_setup(regex_From, next->text, 0, -1))
1873 {
1874 if (!sender_address_forced)
1875 {
1876 uschar *uucp_sender = expand_string(uucp_from_sender);
1877 if (uucp_sender == NULL)
1878 {
1879 log_write(0, LOG_MAIN|LOG_PANIC,
1880 "expansion of \"%s\" failed after matching "
1881 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1882 }
1883 else
1884 {
1885 int start, end, domain;
1886 uschar *errmess;
1887 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1888 &start, &end, &domain, TRUE);
1889 if (newsender != NULL)
1890 {
1891 if (domain == 0 && newsender[0] != 0)
1892 newsender = rewrite_address_qualify(newsender, FALSE);
1893
f05da2e8 1894 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1895 {
1896 sender_address = newsender;
1897
f05da2e8 1898 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1899 {
1900 authenticated_sender = NULL;
1901 originator_name = US"";
1902 sender_local = FALSE;
1903 }
1904
f05da2e8 1905 if (filter_test != FTEST_NONE)
059ec3d9
PH
1906 printf("Sender taken from \"From \" line\n");
1907 }
1908 }
1909 }
1910 }
1911 }
1912
1913 /* Not a leading "From " line. Check to see if it is a valid header line.
1914 Header names may contain any non-control characters except space and colon,
1915 amazingly. */
1916
1917 else
1918 {
1919 uschar *p = next->text;
1920
1921 /* If not a valid header line, break from the header reading loop, leaving
1922 next != NULL, indicating that it holds the first line of the body. */
1923
1924 if (isspace(*p)) break;
1925 while (mac_isgraph(*p) && *p != ':') p++;
1926 while (isspace(*p)) p++;
1927 if (*p != ':')
1928 {
1929 body_zerocount = had_zero;
1930 break;
1931 }
1932
1933 /* We have a valid header line. If there were any binary zeroes in
1934 the line, stomp on them here. */
1935
1936 if (had_zero > 0)
1937 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
1938
1939 /* It is perfectly legal to have an empty continuation line
1940 at the end of a header, but it is confusing to humans
1941 looking at such messages, since it looks like a blank line.
1942 Reduce confusion by removing redundant white space at the
1943 end. We know that there is at least one printing character
1944 (the ':' tested for above) so there is no danger of running
1945 off the end. */
1946
1947 p = next->text + ptr - 2;
1948 for (;;)
1949 {
1950 while (*p == ' ' || *p == '\t') p--;
1951 if (*p != '\n') break;
1952 ptr = (p--) - next->text + 1;
1953 message_size -= next->slen - ptr;
1954 next->text[ptr] = 0;
1955 next->slen = ptr;
1956 }
1957
1958 /* Add the header to the chain */
1959
1960 next->type = htype_other;
1961 next->next = NULL;
1962 header_last->next = next;
1963 header_last = next;
1964
1965 /* Check the limit for individual line lengths. This comes after adding to
1966 the chain so that the failing line is reflected if a bounce is generated
1967 (for a local message). */
1968
1969 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
1970 {
1971 log_write(0, LOG_MAIN, "overlong message header line received from "
1972 "%s (more than %d characters): message abandoned",
1973 sender_host_unknown? sender_ident : sender_fullhost,
1974 header_line_maxsize);
1975
1976 if (smtp_input)
1977 {
1978 smtp_reply = US"552 A message header line is too long";
1979 receive_swallow_smtp();
1980 goto TIDYUP; /* Skip to end of function */
1981 }
1982
1983 else
1984 {
1985 give_local_error(ERRMESS_VLONGHDRLINE,
1986 string_sprintf("message header line longer than %d characters "
1987 "received: message not accepted", header_line_maxsize), US"",
1988 error_rc, stdin, header_list->next);
1989 /* Does not return */
1990 }
1991 }
1992
1993 /* Note if any resent- fields exist. */
1994
1995 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
1996 {
1997 resents_exist = TRUE;
1998 resent_prefix = US"Resent-";
1999 }
2000 }
2001
2002 /* The line has been handled. If we have hit EOF, break out of the loop,
2003 indicating no pending data line. */
2004
2005 if (ch == EOF) { next = NULL; break; }
2006
2007 /* Set up for the next header */
2008
2009 header_size = 256;
2010 next = store_get(sizeof(header_line));
2011 next->text = store_get(header_size);
2012 ptr = 0;
2013 had_zero = 0;
d677b2f2 2014 prevlines_length = 0;
059ec3d9
PH
2015 } /* Continue, starting to read the next header */
2016
2017/* At this point, we have read all the headers into a data structure in main
2018store. The first header is still the dummy placeholder for the Received: header
2019we are going to generate a bit later on. If next != NULL, it contains the first
2020data line - which terminated the headers before reaching a blank line (not the
2021normal case). */
2022
2023DEBUG(D_receive)
2024 {
2025 debug_printf(">>Headers received:\n");
2026 for (h = header_list->next; h != NULL; h = h->next)
2027 debug_printf("%s", h->text);
2028 debug_printf("\n");
2029 }
2030
2031/* End of file on any SMTP connection is an error. If an incoming SMTP call
2032is dropped immediately after valid headers, the next thing we will see is EOF.
2033We must test for this specially, as further down the reading of the data is
2034skipped if already at EOF. */
2035
2036if (smtp_input && (receive_feof)())
2037 {
2038 smtp_reply = handle_lost_connection(US" (after header)");
2039 smtp_yield = FALSE;
2040 goto TIDYUP; /* Skip to end of function */
2041 }
2042
2043/* If this is a filter test run and no headers were read, output a warning
2044in case there is a mistake in the test message. */
2045
f05da2e8 2046if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
2047 printf("Warning: no message headers read\n");
2048
2049
2050/* Scan the headers to identify them. Some are merely marked for later
2051processing; some are dealt with here. */
2052
2053for (h = header_list->next; h != NULL; h = h->next)
2054 {
2055 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
2056 if (is_resent) contains_resent_headers = TRUE;
2057
2058 switch (header_checkname(h, is_resent))
2059 {
059ec3d9 2060 case htype_bcc:
2cbb4081 2061 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
2062 break;
2063
059ec3d9 2064 case htype_cc:
2cbb4081 2065 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
2066 break;
2067
2068 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
2069
2070 case htype_date:
4c69d561 2071 if (!resents_exist || is_resent) date_header_exists = TRUE;
059ec3d9
PH
2072 break;
2073
2074 /* Same comments as about Return-Path: below. */
2075
2076 case htype_delivery_date:
2077 if (delivery_date_remove) h->type = htype_old;
2078 break;
2079
2080 /* Same comments as about Return-Path: below. */
2081
2082 case htype_envelope_to:
2083 if (envelope_to_remove) h->type = htype_old;
2084 break;
2085
2086 /* Mark all "From:" headers so they get rewritten. Save the one that is to
2087 be used for Sender: checking. For Sendmail compatibility, if the "From:"
2088 header consists of just the login id of the user who called Exim, rewrite
2089 it with the gecos field first. Apply this rule to Resent-From: if there
2090 are resent- fields. */
2091
2092 case htype_from:
2093 h->type = htype_from;
2094 if (!resents_exist || is_resent)
2095 {
2096 from_header = h;
2097 if (!smtp_input)
2098 {
5de8faa3 2099 int len;
059ec3d9
PH
2100 uschar *s = Ustrchr(h->text, ':') + 1;
2101 while (isspace(*s)) s++;
5de8faa3 2102 len = h->slen - (s - h->text) - 1;
e0fccd1d
TF
2103 if (Ustrlen(originator_login) == len &&
2104 strncmpic(s, originator_login, len) == 0)
059ec3d9
PH
2105 {
2106 uschar *name = is_resent? US"Resent-From" : US"From";
2107 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2108 originator_login, qualify_domain_sender);
2109 from_header = header_last;
2110 h->type = htype_old;
2111 DEBUG(D_receive|D_rewrite)
2112 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2113 }
2114 }
2115 }
2116 break;
2117
2118 /* Identify the Message-id: header for generating "in-reply-to" in the
2119 autoreply transport. For incoming logging, save any resent- value. In both
2120 cases, take just the first of any multiples. */
2121
2122 case htype_id:
2123 if (msgid_header == NULL && (!resents_exist || is_resent))
2124 {
2125 msgid_header = h;
2126 h->type = htype_id;
2127 }
2128 break;
2129
2130 /* Flag all Received: headers */
2131
2132 case htype_received:
2133 h->type = htype_received;
2134 received_count++;
2135 break;
2136
2137 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2138
2139 case htype_reply_to:
2140 h->type = htype_reply_to;
2141 break;
2142
2143 /* The Return-path: header is supposed to be added to messages when
2144 they leave the SMTP system. We shouldn't receive messages that already
2145 contain Return-path. However, since Exim generates Return-path: on
2146 local delivery, resent messages may well contain it. We therefore
2147 provide an option (which defaults on) to remove any Return-path: headers
2148 on input. Removal actually means flagging as "old", which prevents the
2149 header being transmitted with the message. */
2150
2151 case htype_return_path:
2152 if (return_path_remove) h->type = htype_old;
2153
2154 /* If we are testing a mail filter file, use the value of the
2155 Return-Path: header to set up the return_path variable, which is not
2156 otherwise set. However, remove any <> that surround the address
2157 because the variable doesn't have these. */
2158
f05da2e8 2159 if (filter_test != FTEST_NONE)
059ec3d9
PH
2160 {
2161 uschar *start = h->text + 12;
2162 uschar *end = start + Ustrlen(start);
2163 while (isspace(*start)) start++;
2164 while (end > start && isspace(end[-1])) end--;
2165 if (*start == '<' && end[-1] == '>')
2166 {
2167 start++;
2168 end--;
2169 }
2170 return_path = string_copyn(start, end - start);
2171 printf("Return-path taken from \"Return-path:\" header line\n");
2172 }
2173 break;
2174
2175 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
2176 and from an untrusted caller and suppress_local_fixups is not set, or if we
2177 are in submission mode for a remote message, mark it "old" so that it will
2178 not be transmitted with the message, unless active_local_sender_retain is
2179 set. (This can only be true if active_local_from_check is false.) If there
2180 are any resent- headers in the message, apply this rule to Resent-Sender:
2181 instead of Sender:. Messages with multiple resent- header sets cannot be
2182 tidily handled. (For this reason, at least one MUA - Pine - turns old
2183 resent- headers into X-resent- headers when resending, leaving just one
2184 set.) */
059ec3d9
PH
2185
2186 case htype_sender:
69358f02 2187 h->type = ((!active_local_sender_retain &&
8800895a
PH
2188 (
2189 (sender_local && !trusted_caller && !suppress_local_fixups)
2190 || submission_mode
2191 )
059ec3d9
PH
2192 ) &&
2193 (!resents_exist||is_resent))?
2194 htype_old : htype_sender;
2195 break;
2196
2197 /* Remember the Subject: header for logging. There is no Resent-Subject */
2198
2199 case htype_subject:
2200 subject_header = h;
2201 break;
2202
2203 /* "To:" gets flagged, and the existence of a recipient header is noted,
2204 whether it's resent- or not. */
2205
2206 case htype_to:
2207 h->type = htype_to;
2208 /****
2209 to_or_cc_header_exists = TRUE;
2210 ****/
2211 break;
2212 }
2213 }
2214
2215/* Extract recipients from the headers if that is required (the -t option).
2216Note that this is documented as being done *before* any address rewriting takes
2217place. There are two possibilities:
2218
2219(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2220recipients already listed are to be REMOVED from the message. Smail 3 works
2221like this. We need to build a non-recipients tree for that list, because in
2222subsequent processing this data is held in a tree and that's what the
2223spool_write_header() function expects. Make sure that non-recipient addresses
2224are fully qualified and rewritten if necessary.
2225
2226(2) According to other sendmail documentation, -t ADDS extracted recipients to
2227those in the command line arguments (and it is rumoured some other MTAs do
2228this). Therefore, there is an option to make Exim behave this way.
2229
2230*** Notes on "Resent-" header lines ***
2231
2232The presence of resent-headers in the message makes -t horribly ambiguous.
2233Experiments with sendmail showed that it uses recipients for all resent-
2234headers, totally ignoring the concept of "sets of resent- headers" as described
2235in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2236with all the addresses in one instance of each header.
2237
2238This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2239error for -t if there were resent- headers in the message. However, after a
2240discussion on the mailing list, I've learned that there are MUAs that use
2241resent- headers with -t, and also that the stuff about sets of resent- headers
2242and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2243message with -t and resent- header lines makes sure that only *its* resent-
2244headers are present; previous ones are often renamed as X-resent- for example.
2245
2246Consequently, Exim has been changed so that, if any resent- header lines are
2247present, the recipients are taken from all of the appropriate resent- lines,
2248and not from the ordinary To:, Cc:, etc. */
2249
2250if (extract_recip)
2251 {
2252 int rcount = 0;
2253 error_block **bnext = &bad_addresses;
2254
2255 if (extract_addresses_remove_arguments)
2256 {
2257 while (recipients_count-- > 0)
2258 {
2259 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2260 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2261 tree_add_nonrecipient(s);
2262 }
2263 recipients_list = NULL;
2264 recipients_count = recipients_list_max = 0;
2265 }
2266
059ec3d9
PH
2267 /* Now scan the headers */
2268
2269 for (h = header_list->next; h != NULL; h = h->next)
2270 {
2271 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2272 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2273 {
2274 uschar *s = Ustrchr(h->text, ':') + 1;
2275 while (isspace(*s)) s++;
2276
1eccaa59
PH
2277 parse_allow_group = TRUE; /* Allow address group syntax */
2278
059ec3d9
PH
2279 while (*s != 0)
2280 {
2281 uschar *ss = parse_find_address_end(s, FALSE);
2282 uschar *recipient, *errmess, *p, *pp;
2283 int start, end, domain;
2284
2285 /* Check on maximum */
2286
2287 if (recipients_max > 0 && ++rcount > recipients_max)
2288 {
2289 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2290 US"message rejected: ", error_rc, stdin, NULL);
2291 /* Does not return */
2292 }
2293
2294 /* Make a copy of the address, and remove any internal newlines. These
2295 may be present as a result of continuations of the header line. The
2296 white space that follows the newline must not be removed - it is part
2297 of the header. */
2298
2299 pp = recipient = store_get(ss - s + 1);
2300 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2301 *pp = 0;
2302 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2303 &domain, FALSE);
2304
2305 /* Keep a list of all the bad addresses so we can send a single
2306 error message at the end. However, an empty address is not an error;
2307 just ignore it. This can come from an empty group list like
2308
2309 To: Recipients of list:;
2310
2311 If there are no recipients at all, an error will occur later. */
2312
2313 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2314 {
2315 int len = Ustrlen(s);
2316 error_block *b = store_get(sizeof(error_block));
2317 while (len > 0 && isspace(s[len-1])) len--;
2318 b->next = NULL;
2319 b->text1 = string_printing(string_copyn(s, len));
2320 b->text2 = errmess;
2321 *bnext = b;
2322 bnext = &(b->next);
2323 }
2324
2325 /* If the recipient is already in the nonrecipients tree, it must
2326 have appeared on the command line with the option extract_addresses_
2327 remove_arguments set. Do not add it to the recipients, and keep a note
2328 that this has happened, in order to give a better error if there are
2329 no recipients left. */
2330
2331 else if (recipient != NULL)
2332 {
2333 if (tree_search(tree_nonrecipients, recipient) == NULL)
2334 receive_add_recipient(recipient, -1);
2335 else
2336 extracted_ignored = TRUE;
2337 }
2338
2339 /* Move on past this address */
2340
2341 s = ss + (*ss? 1:0);
2342 while (isspace(*s)) s++;
1eccaa59
PH
2343 } /* Next address */
2344
2345 parse_allow_group = FALSE; /* Reset group syntax flags */
2346 parse_found_group = FALSE;
059ec3d9
PH
2347
2348 /* If this was the bcc: header, mark it "old", which means it
2349 will be kept on the spool, but not transmitted as part of the
2350 message. */
2351
2cbb4081 2352 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2353 } /* For appropriate header line */
2354 } /* For each header line */
2355
059ec3d9
PH
2356 }
2357
2358/* Now build the unique message id. This has changed several times over the
2359lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2360Retaining all the history in the comment has become too unwieldy - read
2361previous release sources if you want it.
2362
2363The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2364The first part is the current time, in seconds. The second part is the current
2365pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2366can hold a number in the range 0-3843. It used to be a computed sequence
2367number, but is now the fractional component of the current time in units of
23681/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2369received, Exim ensures that the timer has ticked at the appropriate level
2370before proceeding, to avoid duplication if the pid happened to be re-used
2371within the same time period. It seems likely that most messages will take at
2372least half a millisecond to be received, so no delay will normally be
2373necessary. At least for some time...
2374
2375There is a modification when localhost_number is set. Formerly this was allowed
2376to be as large as 255. Now it is restricted to the range 0-16, and the final
2377component of the message id becomes (localhost_number * 200) + fractional time
2378in units of 1/200 of a second (i.e. a value in the range 0-3399).
2379
2380Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2381Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2382still allows the tttttt field to hold a large enough number to last for some
2383more decades, and the final two-digit field can hold numbers up to 1295, which
2384is enough for milliseconds (instead of 1/2000 of a second).
2385
2386However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2387pid, so it is probably safe because pids have to be positive. The
2388localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2389final field becomes (localhost_number * 100) + fractional time in centiseconds.
2390
2391Note that string_base62() returns its data in a static storage block, so it
2392must be copied before calling string_base62() again. It always returns exactly
23936 characters.
2394
2395There doesn't seem to be anything in the RFC which requires a message id to
2396start with a letter, but Smail was changed to ensure this. The external form of
2397the message id (as supplied by string expansion) therefore starts with an
2398additional leading 'E'. The spool file names do not include this leading
2399letter and it is not used internally.
2400
2401NOTE: If ever the format of message ids is changed, the regular expression for
2402checking that a string is in this format must be updated in a corresponding
2403way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2404must also be changed to reflect the correct string length. Then, of course,
2405other programs that rely on the message id format will need updating too. */
2406
2407Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2408message_id[6] = '-';
2409Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2410
2411/* Deal with the case where the host number is set. The value of the number was
2412checked when it was read, to ensure it isn't too big. The timing granularity is
2413left in id_resolution so that an appropriate wait can be done after receiving
2414the message, if necessary (we hope it won't be). */
2415
2416if (host_number_string != NULL)
2417 {
2418 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2419 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2420 string_base62((long int)(
2421 host_number * (1000000/id_resolution) +
2422 message_id_tv.tv_usec/id_resolution)) + 4);
2423 }
2424
2425/* Host number not set: final field is just the fractional time at an
2426appropriate resolution. */
2427
2428else
2429 {
2430 id_resolution = (BASE_62 == 62)? 500 : 1000;
2431 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2432 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2433 }
2434
2435/* Add the current message id onto the current process info string if
2436it will fit. */
2437
2438(void)string_format(process_info + process_info_len,
2439 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2440
2441/* If we are using multiple input directories, set up the one for this message
2442to be the least significant base-62 digit of the time of arrival. Otherwise
2443ensure that it is an empty string. */
2444
2445message_subdir[0] = split_spool_directory? message_id[5] : 0;
2446
2447/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2448one, but only for local (without suppress_local_fixups) or submission mode
2449messages. This can be user-configured if required, but we had better flatten
2450any illegal characters therein. */
059ec3d9 2451
8800895a
PH
2452if (msgid_header == NULL &&
2453 ((sender_host_address == NULL && !suppress_local_fixups)
2454 || submission_mode))
059ec3d9
PH
2455 {
2456 uschar *p;
2457 uschar *id_text = US"";
2458 uschar *id_domain = primary_hostname;
2459
2460 /* Permit only letters, digits, dots, and hyphens in the domain */
2461
2462 if (message_id_domain != NULL)
2463 {
2464 uschar *new_id_domain = expand_string(message_id_domain);
2465 if (new_id_domain == NULL)
2466 {
2467 if (!expand_string_forcedfail)
2468 log_write(0, LOG_MAIN|LOG_PANIC,
2469 "expansion of \"%s\" (message_id_header_domain) "
2470 "failed: %s", message_id_domain, expand_string_message);
2471 }
2472 else if (*new_id_domain != 0)
2473 {
2474 id_domain = new_id_domain;
2475 for (p = id_domain; *p != 0; p++)
2476 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2477 }
2478 }
2479
2480 /* Permit all characters except controls and RFC 2822 specials in the
2481 additional text part. */
2482
2483 if (message_id_text != NULL)
2484 {
2485 uschar *new_id_text = expand_string(message_id_text);
2486 if (new_id_text == NULL)
2487 {
2488 if (!expand_string_forcedfail)
2489 log_write(0, LOG_MAIN|LOG_PANIC,
2490 "expansion of \"%s\" (message_id_header_text) "
2491 "failed: %s", message_id_text, expand_string_message);
2492 }
2493 else if (*new_id_text != 0)
2494 {
2495 id_text = new_id_text;
2496 for (p = id_text; *p != 0; p++)
2497 if (mac_iscntrl_or_special(*p)) *p = '-';
2498 }
2499 }
2500
e7e680d6
PP
2501 /* Add the header line
2502 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2503 * appended, to preserve classical expectations of header ordering. */
059ec3d9 2504
e7e680d6 2505 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
5eb690a1
NM
2506 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2507 (*id_text == 0)? "" : ".", id_text, id_domain);
059ec3d9
PH
2508 }
2509
2510/* If we are to log recipients, keep a copy of the raw ones before any possible
2511rewriting. Must copy the count, because later ACLs and the local_scan()
2512function may mess with the real recipients. */
2513
2514if ((log_extra_selector & LX_received_recipients) != 0)
2515 {
2516 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2517 for (i = 0; i < recipients_count; i++)
2518 raw_recipients[i] = string_copy(recipients_list[i].address);
2519 raw_recipients_count = recipients_count;
2520 }
2521
2522/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2523recipients will get here only if the conditions were right (allow_unqualified_
2524recipient is TRUE). */
2525
2526for (i = 0; i < recipients_count; i++)
2527 recipients_list[i].address =
2528 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2529 global_rewrite_rules, rewrite_existflags);
2530
8800895a
PH
2531/* If there is no From: header, generate one for local (without
2532suppress_local_fixups) or submission_mode messages. If there is no sender
2533address, but the sender is local or this is a local delivery error, use the
2534originator login. This shouldn't happen for genuine bounces, but might happen
2535for autoreplies. The addition of From: must be done *before* checking for the
2536possible addition of a Sender: header, because untrusted_set_sender allows an
2537untrusted user to set anything in the envelope (which might then get into
2538From:) but we still want to ensure a valid Sender: if it is required. */
2539
2540if (from_header == NULL &&
2541 ((sender_host_address == NULL && !suppress_local_fixups)
2542 || submission_mode))
059ec3d9 2543 {
2fe1a124
PH
2544 uschar *oname = US"";
2545
2546 /* Use the originator_name if this is a locally submitted message and the
2547 caller is not trusted. For trusted callers, use it only if -F was used to
2548 force its value or if we have a non-SMTP message for which -f was not used
2549 to set the sender. */
2550
2551 if (sender_host_address == NULL)
2552 {
2553 if (!trusted_caller || sender_name_forced ||
2554 (!smtp_input && !sender_address_forced))
2555 oname = originator_name;
2556 }
2557
2558 /* For non-locally submitted messages, the only time we use the originator
2559 name is when it was forced by the /name= option on control=submission. */
2560
2561 else
2562 {
2563 if (submission_name != NULL) oname = submission_name;
2564 }
2565
059ec3d9
PH
2566 /* Envelope sender is empty */
2567
2568 if (sender_address[0] == 0)
2569 {
87ba3f5f
PH
2570 uschar *fromstart, *fromend;
2571
2572 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2573 oname, (oname[0] == 0)? "" : " <");
2574 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2575
059ec3d9
PH
2576 if (sender_local || local_error_message)
2577 {
87ba3f5f
PH
2578 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2579 local_part_quote(originator_login), qualify_domain_sender,
2580 fromend);
059ec3d9
PH
2581 }
2582 else if (submission_mode && authenticated_id != NULL)
2583 {
2584 if (submission_domain == NULL)
2585 {
87ba3f5f
PH
2586 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2587 local_part_quote(authenticated_id), qualify_domain_sender,
2588 fromend);
059ec3d9
PH
2589 }
2590 else if (submission_domain[0] == 0) /* empty => whole address set */
2591 {
87ba3f5f
PH
2592 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2593 fromend);
059ec3d9
PH
2594 }
2595 else
2596 {
87ba3f5f
PH
2597 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2598 local_part_quote(authenticated_id), submission_domain,
2599 fromend);
059ec3d9
PH
2600 }
2601 from_header = header_last; /* To get it checked for Sender: */
2602 }
2603 }
2604
2605 /* There is a non-null envelope sender. Build the header using the original
2606 sender address, before any rewriting that might have been done while
2607 verifying it. */
2608
2609 else
2610 {
87ba3f5f 2611 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2612 oname,
2613 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2614 (sender_address_unrewritten == NULL)?
2615 sender_address : sender_address_unrewritten,
2fe1a124 2616 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2617
2618 from_header = header_last; /* To get it checked for Sender: */
2619 }
2620 }
2621
2622
8800895a
PH
2623/* If the sender is local (without suppress_local_fixups), or if we are in
2624submission mode and there is an authenticated_id, check that an existing From:
2625is correct, and if not, generate a Sender: header, unless disabled. Any
2626previously-existing Sender: header was removed above. Note that sender_local,
2627as well as being TRUE if the caller of exim is not trusted, is also true if a
2628trusted caller did not supply a -f argument for non-smtp input. To allow
2629trusted callers to forge From: without supplying -f, we have to test explicitly
2630here. If the From: header contains more than one address, then the call to
2631parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2632
2633if (from_header != NULL &&
69358f02 2634 (active_local_from_check &&
8800895a 2635 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2636 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2637 ))
2638 {
2639 BOOL make_sender = TRUE;
2640 int start, end, domain;
2641 uschar *errmess;
2642 uschar *from_address =
2643 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2644 &start, &end, &domain, FALSE);
2645 uschar *generated_sender_address;
2646
2647 if (submission_mode)
2648 {
2649 if (submission_domain == NULL)
2650 {
2651 generated_sender_address = string_sprintf("%s@%s",
2652 local_part_quote(authenticated_id), qualify_domain_sender);
2653 }
2654 else if (submission_domain[0] == 0) /* empty => full address */
2655 {
2656 generated_sender_address = string_sprintf("%s",
2657 authenticated_id);
2658 }
2659 else
2660 {
2661 generated_sender_address = string_sprintf("%s@%s",
2662 local_part_quote(authenticated_id), submission_domain);
2663 }
2664 }
2665 else
2666 generated_sender_address = string_sprintf("%s@%s",
2667 local_part_quote(originator_login), qualify_domain_sender);
2668
2669 /* Remove permitted prefixes and suffixes from the local part of the From:
2670 address before doing the comparison with the generated sender. */
2671
2672 if (from_address != NULL)
2673 {
2674 int slen;
2675 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2676
2677 if (at != NULL) *at = 0;
2678 from_address += route_check_prefix(from_address, local_from_prefix);
2679 slen = route_check_suffix(from_address, local_from_suffix);
2680 if (slen > 0)
2681 {
2682 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2683 from_address += slen;
2684 }
2685 if (at != NULL) *at = '@';
2686
2687 if (strcmpic(generated_sender_address, from_address) == 0 ||
2688 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2689 make_sender = FALSE;
2690 }
2691
2692 /* We have to cause the Sender header to be rewritten if there are
2693 appropriate rewriting rules. */
2694
2695 if (make_sender)
2696 {
2fe1a124 2697 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2698 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2699 generated_sender_address);
2700 else
2701 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2702 resent_prefix,
2703 submission_mode? submission_name : originator_name,
2704 generated_sender_address);
059ec3d9 2705 }
87ba3f5f
PH
2706
2707 /* Ensure that a non-null envelope sender address corresponds to the
2708 submission mode sender address. */
2709
2710 if (submission_mode && sender_address[0] != 0)
2711 {
2712 if (sender_address_unrewritten == NULL)
2713 sender_address_unrewritten = sender_address;
2714 sender_address = generated_sender_address;
089793a4
TF
2715 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2716 log_write(L_address_rewrite, LOG_MAIN,
2717 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2718 sender_address_unrewritten, generated_sender_address);
87ba3f5f 2719 }
059ec3d9
PH
2720 }
2721
059ec3d9
PH
2722/* If there are any rewriting rules, apply them to the sender address, unless
2723it has already been rewritten as part of verification for SMTP input. */
2724
2725if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2726 sender_address[0] != 0)
2727 {
2728 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2729 global_rewrite_rules, rewrite_existflags);
2730 DEBUG(D_receive|D_rewrite)
2731 debug_printf("rewritten sender = %s\n", sender_address);
2732 }
2733
2734
2735/* The headers must be run through rewrite_header(), because it ensures that
2736addresses are fully qualified, as well as applying any rewriting rules that may
2737exist.
2738
2739Qualification of header addresses in a message from a remote host happens only
2740if the host is in sender_unqualified_hosts or recipient_unqualified_hosts, as
2741appropriate. For local messages, qualification always happens, unless -bnq is
2742used to explicitly suppress it. No rewriting is done for an unqualified address
2743that is left untouched.
2744
2745We start at the second header, skipping our own Received:. This rewriting is
2746documented as happening *after* recipient addresses are taken from the headers
2747by the -t command line option. An added Sender: gets rewritten here. */
2748
2749for (h = header_list->next; h != NULL; h = h->next)
2750 {
2751 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2752 rewrite_existflags, TRUE);
2753 if (newh != NULL) h = newh;
2754 }
2755
2756
2757/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2758"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2759"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2760exists, this applies to the set of resent- headers rather than the normal set.
2761
2cbb4081
PH
2762The requirement for a recipient header has been removed in RFC 2822. At this
2763point in the code, earlier versions of Exim added a To: header for locally
2764submitted messages, and an empty Bcc: header for others. In the light of the
2765changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2766
059ec3d9
PH
2767
2768/* If there is no date header, generate one if the message originates locally
8800895a
PH
2769(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2770submission mode flag is set. Messages without Date: are not valid, but it seems
e7e680d6
PP
2771to be more confusing if Exim adds one to all remotely-originated messages.
2772As per Message-Id, we prepend if resending, else append.
2773*/
059ec3d9 2774
8800895a
PH
2775if (!date_header_exists &&
2776 ((sender_host_address == NULL && !suppress_local_fixups)
2777 || submission_mode))
e7e680d6
PP
2778 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2779 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
059ec3d9
PH
2780
2781search_tidyup(); /* Free any cached resources */
2782
2783/* Show the complete set of headers if debugging. Note that the first one (the
2784new Received:) has not yet been set. */
2785
2786DEBUG(D_receive)
2787 {
2788 debug_printf(">>Headers after rewriting and local additions:\n");
2789 for (h = header_list->next; h != NULL; h = h->next)
2790 debug_printf("%c %s", h->type, h->text);
2791 debug_printf("\n");
2792 }
2793
2794/* The headers are now complete in store. If we are running in filter
2795testing mode, that is all this function does. Return TRUE if the message
2796ended with a dot. */
2797
f05da2e8 2798if (filter_test != FTEST_NONE)
059ec3d9
PH
2799 {
2800 process_info[process_info_len] = 0;
2801 return message_ended == END_DOT;
2802 }
2803
817d9f57 2804/* Cutthrough delivery:
e4bdf652
JH
2805 We have to create the Received header now rather than at the end of reception,
2806 so the timestamp behaviour is a change to the normal case.
2807 XXX Ensure this gets documented XXX.
817d9f57 2808 Having created it, send the headers to the destination.
e4bdf652
JH
2809*/
2810if (cutthrough_fd >= 0)
2811 {
817d9f57
JH
2812 if (received_count > received_headers_max)
2813 {
2e5b33cd 2814 cancel_cutthrough_connection("too many headers");
817d9f57
JH
2815 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2816 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2817 "Too many \"Received\" headers",
2818 sender_address,
2819 (sender_fullhost == NULL)? "" : " H=",
2820 (sender_fullhost == NULL)? US"" : sender_fullhost,
2821 (sender_ident == NULL)? "" : " U=",
2822 (sender_ident == NULL)? US"" : sender_ident);
2823 message_id[0] = 0; /* Indicate no message accepted */
2824 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2825 goto TIDYUP; /* Skip to end of function */
2826 }
e4bdf652
JH
2827 received_header_gen();
2828 add_acl_headers(US"MAIL or RCPT");
2829 (void) cutthrough_headers_send();
2830 }
61147df4 2831
e4bdf652 2832
059ec3d9
PH
2833/* Open a new spool file for the data portion of the message. We need
2834to access it both via a file descriptor and a stream. Try to make the
2835directory if it isn't there. Note re use of sprintf: spool_directory
2836is checked on input to be < 200 characters long. */
2837
2838sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir,
2839 message_id);
2840data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2841if (data_fd < 0)
2842 {
2843 if (errno == ENOENT)
2844 {
2845 uschar temp[16];
2846 sprintf(CS temp, "input/%s", message_subdir);
2847 if (message_subdir[0] == 0) temp[5] = 0;
2848 (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE);
2849 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2850 }
2851 if (data_fd < 0)
2852 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2853 spool_name, strerror(errno));
2854 }
2855
2856/* Make sure the file's group is the Exim gid, and double-check the mode
2857because the group setting doesn't always get set automatically. */
2858
1ac6b2e7
JH
2859if (fchown(data_fd, exim_uid, exim_gid))
2860 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2861 "Failed setting ownership on spool file %s: %s",
2862 spool_name, strerror(errno));
ff790e47 2863(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2864
2865/* We now have data file open. Build a stream for it and lock it. We lock only
2866the first line of the file (containing the message ID) because otherwise there
2867are problems when Exim is run under Cygwin (I'm told). See comments in
2868spool_in.c, where the same locking is done. */
2869
2870data_file = fdopen(data_fd, "w+");
2871lock_data.l_type = F_WRLCK;
2872lock_data.l_whence = SEEK_SET;
2873lock_data.l_start = 0;
2874lock_data.l_len = SPOOL_DATA_START_OFFSET;
2875
2876if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2877 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2878 errno, strerror(errno));
2879
2880/* We have an open, locked data file. Write the message id to it to make it
2881self-identifying. Then read the remainder of the input of this message and
2882write it to the data file. If the variable next != NULL, it contains the first
2883data line (which was read as a header but then turned out not to have the right
2884format); write it (remembering that it might contain binary zeros). The result
2885of fwrite() isn't inspected; instead we call ferror() below. */
2886
2887fprintf(data_file, "%s-D\n", message_id);
2888if (next != NULL)
2889 {
2890 uschar *s = next->text;
2891 int len = next->slen;
1ac6b2e7 2892 len = fwrite(s, 1, len, data_file); len = len; /* compiler quietening */
059ec3d9
PH
2893 body_linecount++; /* Assumes only 1 line */
2894 }
2895
2896/* Note that we might already be at end of file, or the logical end of file
2897(indicated by '.'), or might have encountered an error while writing the
2898message id or "next" line. */
2899
2900if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2901 {
2902 if (smtp_input)
2903 {
2904 message_ended = read_message_data_smtp(data_file);
2905 receive_linecount++; /* The terminating "." line */
2906 }
2907 else message_ended = read_message_data(data_file);
2908
2909 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 2910 message_linecount += body_linecount;
059ec3d9
PH
2911
2912 /* Handle premature termination of SMTP */
2913
2914 if (smtp_input && message_ended == END_EOF)
2915 {
2916 Uunlink(spool_name); /* Lose data file when closed */
2e5b33cd 2917 cancel_cutthrough_connection("sender closed connection");
059ec3d9
PH
2918 message_id[0] = 0; /* Indicate no message accepted */
2919 smtp_reply = handle_lost_connection(US"");
2920 smtp_yield = FALSE;
2921 goto TIDYUP; /* Skip to end of function */
2922 }
2923
2924 /* Handle message that is too big. Don't use host_or_ident() in the log
2925 message; we want to see the ident value even for non-remote messages. */
2926
2927 if (message_ended == END_SIZE)
2928 {
2929 Uunlink(spool_name); /* Lose the data file when closed */
2e5b33cd 2930 cancel_cutthrough_connection("mail too big");
059ec3d9
PH
2931 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2932
2933 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2934 "message too big: read=%d max=%d",
2935 sender_address,
2936 (sender_fullhost == NULL)? "" : " H=",
2937 (sender_fullhost == NULL)? US"" : sender_fullhost,
2938 (sender_ident == NULL)? "" : " U=",
2939 (sender_ident == NULL)? US"" : sender_ident,
2940 message_size,
2941 thismessage_size_limit);
2942
2943 if (smtp_input)
2944 {
2945 smtp_reply = US"552 Message size exceeds maximum permitted";
2946 message_id[0] = 0; /* Indicate no message accepted */
2947 goto TIDYUP; /* Skip to end of function */
2948 }
2949 else
2950 {
2951 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2952 give_local_error(ERRMESS_TOOBIG,
2953 string_sprintf("message too big (max=%d)", thismessage_size_limit),
2954 US"message rejected: ", error_rc, data_file, header_list);
2955 /* Does not return */
2956 }
2957 }
2958 }
2959
2960/* Restore the standard SIGALRM handler for any subsequent processing. (For
2961example, there may be some expansion in an ACL that uses a timer.) */
2962
2963os_non_restarting_signal(SIGALRM, sigalrm_handler);
2964
2965/* The message body has now been read into the data file. Call fflush() to
2966empty the buffers in C, and then call fsync() to get the data written out onto
2967the disk, as fflush() doesn't do this (or at least, it isn't documented as
2968having to do this). If there was an I/O error on either input or output,
2969attempt to send an error message, and unlink the spool file. For non-SMTP input
2970we can then give up. Note that for SMTP input we must swallow the remainder of
2971the input in cases of output errors, since the far end doesn't expect to see
2972anything until the terminating dot line is sent. */
2973
2974if (fflush(data_file) == EOF || ferror(data_file) ||
54fc8428 2975 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
059ec3d9
PH
2976 {
2977 uschar *msg_errno = US strerror(errno);
2978 BOOL input_error = (receive_ferror)() != 0;
2979 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
2980 input_error? "Input read" : "Spool write",
2981 msg_errno,
2982 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
2983
2984 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
2985 Uunlink(spool_name); /* Lose the data file */
2e5b33cd 2986 cancel_cutthrough_connection("error writing spoolfile");
059ec3d9
PH
2987
2988 if (smtp_input)
2989 {
2990 if (input_error)
2991 smtp_reply = US"451 Error while reading input data";
2992 else
2993 {
2994 smtp_reply = US"451 Error while writing spool file";
2995 receive_swallow_smtp();
2996 }
2997 message_id[0] = 0; /* Indicate no message accepted */
2998 goto TIDYUP; /* Skip to end of function */
2999 }
3000
3001 else
3002 {
3003 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3004 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
3005 header_list);
3006 /* Does not return */
3007 }
3008 }
3009
3010
3011/* No I/O errors were encountered while writing the data file. */
3012
3013DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
3014
3015
3016/* If there were any bad addresses extracted by -t, or there were no recipients
3017left after -t, send a message to the sender of this message, or write it to
3018stderr if the error handling option is set that way. Note that there may
3019legitimately be no recipients for an SMTP message if they have all been removed
3020by "discard".
3021
3022We need to rewind the data file in order to read it. In the case of no
3023recipients or stderr error writing, throw the data file away afterwards, and
3024exit. (This can't be SMTP, which always ensures there's at least one
3025syntactically good recipient address.) */
3026
3027if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
3028 {
3029 DEBUG(D_receive)
3030 {
3031 if (recipients_count == 0) debug_printf("*** No recipients\n");
3032 if (bad_addresses != NULL)
3033 {
3034 error_block *eblock = bad_addresses;
3035 debug_printf("*** Bad address(es)\n");
3036 while (eblock != NULL)
3037 {
3038 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
3039 eblock = eblock->next;
3040 }
3041 }
3042 }
3043
3044 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3045
3046 /* If configured to send errors to the sender, but this fails, force
3047 a failure error code. We use a special one for no recipients so that it
3048 can be detected by the autoreply transport. Otherwise error_rc is set to
3049 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
3050 it is EXIT_SUCCESS. */
3051
3052 if (error_handling == ERRORS_SENDER)
3053 {
3054 if (!moan_to_sender(
3055 (bad_addresses == NULL)?
3056 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
3057 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
3058 bad_addresses, header_list, data_file, FALSE))
3059 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
3060 }
3061 else
3062 {
3063 if (bad_addresses == NULL)
3064 {
3065 if (extracted_ignored)
3066 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
3067 else
3068 fprintf(stderr, "exim: no recipients in message\n");
3069 }
3070 else
3071 {
3072 fprintf(stderr, "exim: invalid address%s",
3073 (bad_addresses->next == NULL)? ":" : "es:\n");
3074 while (bad_addresses != NULL)
3075 {
3076 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
3077 bad_addresses->text2);
3078 bad_addresses = bad_addresses->next;
3079 }
3080 }
3081 }
3082
3083 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
3084 {
3085 Uunlink(spool_name);
f1e894f3 3086 (void)fclose(data_file);
059ec3d9
PH
3087 exim_exit(error_rc);
3088 }
3089 }
3090
3091/* Data file successfully written. Generate text for the Received: header by
3092expanding the configured string, and adding a timestamp. By leaving this
3093operation till now, we ensure that the timestamp is the time that message
3094reception was completed. However, this is deliberately done before calling the
3095data ACL and local_scan().
3096
3097This Received: header may therefore be inspected by the data ACL and by code in
3098the local_scan() function. When they have run, we update the timestamp to be
3099the final time of reception.
3100
3101If there is just one recipient, set up its value in the $received_for variable
3102for use when we generate the Received: header.
3103
3104Note: the checking for too many Received: headers is handled by the delivery
3105code. */
e4bdf652 3106/*XXX eventually add excess Received: check for cutthrough case back when classifying them */
059ec3d9 3107
e4bdf652 3108if (received_header->text == NULL) /* Non-cutthrough case */
059ec3d9 3109 {
e4bdf652 3110 received_header_gen();
059ec3d9 3111
e4bdf652 3112 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
059ec3d9 3113
e4bdf652
JH
3114 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3115 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9 3116
e4bdf652
JH
3117 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3118 now, before running the DATA ACL. */
059ec3d9 3119
e4bdf652
JH
3120 add_acl_headers(US"MAIL or RCPT");
3121 }
817d9f57 3122else
e4bdf652
JH
3123 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3124 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9
PH
3125
3126/* If an ACL is specified for checking things at this stage of reception of a
3127message, run it, unless all the recipients were removed by "discard" in earlier
3128ACLs. That is the only case in which recipients_count can be zero at this
3129stage. Set deliver_datafile to point to the data file so that $message_body and
3130$message_body_end can be extracted if needed. Allow $recipients in expansions.
3131*/
3132
3133deliver_datafile = data_fd;
4e88a19f 3134user_msg = NULL;
059ec3d9 3135
0e20aff9
MH
3136enable_dollar_recipients = TRUE;
3137
059ec3d9
PH
3138if (recipients_count == 0)
3139 {
3140 blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL";
3141 }
3142else
3143 {
059ec3d9
PH
3144 /* Handle interactive SMTP messages */
3145
3146 if (smtp_input && !smtp_batched_input)
3147 {
8523533c 3148
80a47a2c
TK
3149#ifndef DISABLE_DKIM
3150 if (!dkim_disable_verify)
3151 {
3152 /* Finish verification, this will log individual signature results to
3153 the mainlog */
3154 dkim_exim_verify_finish();
3155
3156 /* Check if we must run the DKIM ACL */
3157 if ((acl_smtp_dkim != NULL) &&
3158 (dkim_verify_signers != NULL) &&
3159 (dkim_verify_signers[0] != '\0'))
3160 {
3161 uschar *dkim_verify_signers_expanded =
3162 expand_string(dkim_verify_signers);
3163 if (dkim_verify_signers_expanded == NULL)
3164 {
3165 log_write(0, LOG_MAIN|LOG_PANIC,
3166 "expansion of dkim_verify_signers option failed: %s",
3167 expand_string_message);
3168 }
3169 else
3170 {
3171 int sep = 0;
3172 uschar *ptr = dkim_verify_signers_expanded;
3173 uschar *item = NULL;
9e5d6b55
TK
3174 uschar *seen_items = NULL;
3175 int seen_items_size = 0;
3176 int seen_items_offset = 0;
80a47a2c 3177 uschar itembuf[256];
9122af94
TK
3178 /* Default to OK when no items are present */
3179 rc = OK;
80a47a2c
TK
3180 while ((item = string_nextinlist(&ptr, &sep,
3181 itembuf,
3182 sizeof(itembuf))) != NULL)
3183 {
6119d1ea
TK
3184 /* Prevent running ACL for an empty item */
3185 if (!item || (item[0] == '\0')) continue;
9e5d6b55
TK
3186 /* Only run ACL once for each domain or identity, no matter how often it
3187 appears in the expanded list. */
6119d1ea
TK
3188 if (seen_items != NULL)
3189 {
ae9094bf
TK
3190 uschar *seen_item = NULL;
3191 uschar seen_item_buf[256];
4a73449b 3192 uschar *seen_items_list = seen_items;
ae9094bf 3193 int seen_this_item = 0;
61147df4 3194
ae9094bf
TK
3195 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
3196 seen_item_buf,
3197 sizeof(seen_item_buf))) != NULL)
3198 {
3199 if (Ustrcmp(seen_item,item) == 0)
3200 {
3201 seen_this_item = 1;
3202 break;
61147df4 3203 }
ae9094bf
TK
3204 }
3205
3206 if (seen_this_item > 0)
6119d1ea
TK
3207 {
3208 DEBUG(D_receive)
3209 debug_printf("acl_smtp_dkim: skipping signer %s, already seen\n", item);
3210 continue;
3211 }
61147df4 3212
4a73449b 3213 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,":");
6119d1ea
TK
3214 }
3215
4a73449b
TK
3216 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,item);
3217 seen_items[seen_items_offset] = '\0';
6119d1ea
TK
3218
3219 DEBUG(D_receive)
3220 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n", item);
3221
80a47a2c
TK
3222 dkim_exim_acl_setup(item);
3223 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim, &user_msg, &log_msg);
6119d1ea
TK
3224
3225 if (rc != OK)
3226 {
3227 DEBUG(D_receive)
3228 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, skipping remaining items\n", rc, item);
2e5b33cd 3229 cancel_cutthrough_connection("dkim acl not ok");
6119d1ea
TK
3230 break;
3231 }
80a47a2c
TK
3232 }
3233 add_acl_headers(US"DKIM");
3234 if (rc == DISCARD)
3235 {
3236 recipients_count = 0;
3237 blackholed_by = US"DKIM ACL";
3238 if (log_msg != NULL)
3239 blackhole_log_msg = string_sprintf(": %s", log_msg);
3240 }
3241 else if (rc != OK)
3242 {
3243 Uunlink(spool_name);
3244 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
3245 smtp_yield = FALSE; /* No more messsages after dropped connection */
3246 smtp_reply = US""; /* Indicate reply already sent */
3247 message_id[0] = 0; /* Indicate no message accepted */
3248 goto TIDYUP; /* Skip to end of function */
3249 }
3250 }
3251 }
3252 }
fb2274d4 3253
8523533c 3254#ifdef WITH_CONTENT_SCAN
80a47a2c
TK
3255 if (recipients_count > 0 &&
3256 acl_smtp_mime != NULL &&
54cdb463
PH
3257 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3258 goto TIDYUP;
8523533c
TK
3259#endif /* WITH_CONTENT_SCAN */
3260
4840604e
TL
3261#ifdef EXPERIMENTAL_DMARC
3262 dmarc_up = dmarc_store_data(from_header);
3263#endif /* EXPERIMENTAL_DMARC */
3264
fd98a5c6
JH
3265#ifdef EXPERIMENTAL_PRDR
3266 if (prdr_requested && recipients_count > 1 && acl_smtp_data_prdr != NULL )
3267 {
3268 unsigned int c;
3269 int all_pass = OK;
3270 int all_fail = FAIL;
3271
3272 smtp_printf("353 PRDR content analysis beginning\r\n");
3273 /* Loop through recipients, responses must be in same order received */
3274 for (c = 0; recipients_count > c; c++)
3275 {
3276 uschar * addr= recipients_list[c].address;
3277 uschar * msg= US"PRDR R=<%s> %s";
3278 uschar * code;
3279 DEBUG(D_receive)
3280 debug_printf("PRDR processing recipient %s (%d of %d)\n",
3281 addr, c+1, recipients_count);
3282 rc = acl_check(ACL_WHERE_PRDR, addr,
3283 acl_smtp_data_prdr, &user_msg, &log_msg);
3284
3285 /* If any recipient rejected content, indicate it in final message */
3286 all_pass |= rc;
3287 /* If all recipients rejected, indicate in final message */
3288 all_fail &= rc;
3289
3290 switch (rc)
3291 {
3292 case OK: case DISCARD: code = US"250"; break;
3293 case DEFER: code = US"450"; break;
3294 default: code = US"550"; break;
3295 }
3296 if (user_msg != NULL)
3297 smtp_user_msg(code, user_msg);
3298 else
3299 {
3300 switch (rc)
3301 {
3302 case OK: case DISCARD:
3303 msg = string_sprintf(CS msg, addr, "acceptance"); break;
3304 case DEFER:
3305 msg = string_sprintf(CS msg, addr, "temporary refusal"); break;
3306 default:
3307 msg = string_sprintf(CS msg, addr, "refusal"); break;
3308 }
3309 smtp_user_msg(code, msg);
3310 }
3311 if (log_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, log_msg);
3312 else if (user_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, user_msg);
3313 else log_write(0, LOG_MAIN, CS msg);
3314
3315 if (rc != OK) { receive_remove_recipient(addr); c--; }
3316 }
3317 /* Set up final message, used if data acl gives OK */
3318 smtp_reply = string_sprintf("%s id=%s message %s",
3319 all_fail == FAIL ? US"550" : US"250",
3320 message_id,
3321 all_fail == FAIL
3322 ? US"rejected for all recipients"
3323 : all_pass == OK
3324 ? US"accepted"
3325 : US"accepted for some recipients");
3326 if (recipients_count == 0)
3327 {
3328 message_id[0] = 0; /* Indicate no message accepted */
3329 goto TIDYUP;
3330 }
3331 }
3332 else
3333 prdr_requested = FALSE;
3334#endif /* EXPERIMENTAL_PRDR */
3335
54cdb463
PH
3336 /* Check the recipients count again, as the MIME ACL might have changed
3337 them. */
8523533c 3338
059ec3d9
PH
3339 if (acl_smtp_data != NULL && recipients_count > 0)
3340 {
059ec3d9
PH
3341 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
3342 add_acl_headers(US"DATA");
3343 if (rc == DISCARD)
3344 {
3345 recipients_count = 0;
3346 blackholed_by = US"DATA ACL";
8e669ac1
PH
3347 if (log_msg != NULL)
3348 blackhole_log_msg = string_sprintf(": %s", log_msg);
2e5b33cd 3349 cancel_cutthrough_connection("data acl discard");
059ec3d9
PH
3350 }
3351 else if (rc != OK)
3352 {
3353 Uunlink(spool_name);
2e5b33cd 3354 cancel_cutthrough_connection("data acl not ok");
8523533c
TK
3355#ifdef WITH_CONTENT_SCAN
3356 unspool_mbox();
6f0c431a
PP
3357#endif
3358#ifdef EXPERIMENTAL_DCC
3359 dcc_ok = 0;
8523533c 3360#endif
059ec3d9
PH
3361 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
3362 smtp_yield = FALSE; /* No more messsages after dropped connection */
3363 smtp_reply = US""; /* Indicate reply already sent */
3364 message_id[0] = 0; /* Indicate no message accepted */
3365 goto TIDYUP; /* Skip to end of function */
3366 }
3367 }
3368 }
3369
3370 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3371 we cannot take different actions for permanent and temporary rejections. */
3372
54cdb463 3373 else
059ec3d9 3374 {
54cdb463
PH
3375
3376#ifdef WITH_CONTENT_SCAN
3377 if (acl_not_smtp_mime != NULL &&
3378 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3379 &blackholed_by))
3380 goto TIDYUP;
3381#endif /* WITH_CONTENT_SCAN */
3382
3383 if (acl_not_smtp != NULL)
059ec3d9 3384 {
54cdb463
PH
3385 uschar *user_msg, *log_msg;
3386 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3387 if (rc == DISCARD)
059ec3d9 3388 {
54cdb463
PH
3389 recipients_count = 0;
3390 blackholed_by = US"non-SMTP ACL";
3391 if (log_msg != NULL)
3392 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 3393 }
54cdb463 3394 else if (rc != OK)
059ec3d9 3395 {
54cdb463
PH
3396 Uunlink(spool_name);
3397#ifdef WITH_CONTENT_SCAN
3398 unspool_mbox();
6f0c431a
PP
3399#endif
3400#ifdef EXPERIMENTAL_DCC
3401 dcc_ok = 0;
54cdb463 3402#endif
6ea85e9a
PH
3403 /* The ACL can specify where rejections are to be logged, possibly
3404 nowhere. The default is main and reject logs. */
3405
3406 if (log_reject_target != 0)
3407 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3408 sender_address, log_msg);
3409
54cdb463
PH
3410 if (user_msg == NULL) user_msg = US"local configuration problem";
3411 if (smtp_batched_input)
3412 {
3413 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3414 /* Does not return */
3415 }
3416 else
3417 {
3418 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3419 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3420 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3421 header_list);
3422 /* Does not return */
3423 }
059ec3d9 3424 }
54cdb463 3425 add_acl_headers(US"non-SMTP");
059ec3d9 3426 }
059ec3d9
PH
3427 }
3428
4840604e
TL
3429#endif /* DISABLE_DKIM */
3430
54cdb463
PH
3431 /* The applicable ACLs have been run */
3432
059ec3d9
PH
3433 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3434 if (queue_only_policy) queued_by = US"ACL";
059ec3d9
PH
3435 }
3436
8523533c
TK
3437#ifdef WITH_CONTENT_SCAN
3438unspool_mbox();
3439#endif
3440
6a8f9482
TK
3441#ifdef EXPERIMENTAL_DCC
3442dcc_ok = 0;
3443#endif
3444
3445
059ec3d9
PH
3446/* The final check on the message is to run the local_scan() function. The
3447version supplied with Exim always accepts, but this is a hook for sysadmins to
3448supply their own checking code. The local_scan() function is run even when all
3449the recipients have been discarded. */
3450
3451lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3452
3453/* Arrange to catch crashes in local_scan(), so that the -D file gets
3454deleted, and the incident gets logged. */
3455
3456os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3457os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3458os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3459os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3460
3461DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3462 local_scan_timeout);
3463local_scan_data = NULL;
3464
3465os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3466if (local_scan_timeout > 0) alarm(local_scan_timeout);
3467rc = local_scan(data_fd, &local_scan_data);
3468alarm(0);
3469os_non_restarting_signal(SIGALRM, sigalrm_handler);
3470
0e20aff9
MH
3471enable_dollar_recipients = FALSE;
3472
059ec3d9
PH
3473store_pool = POOL_MAIN; /* In case changed */
3474DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3475 local_scan_data);
3476
3477os_non_restarting_signal(SIGSEGV, SIG_DFL);
3478os_non_restarting_signal(SIGFPE, SIG_DFL);
3479os_non_restarting_signal(SIGILL, SIG_DFL);
3480os_non_restarting_signal(SIGBUS, SIG_DFL);
3481
3482/* The length check is paranoia against some runaway code, and also because
3483(for a success return) lines in the spool file are read into big_buffer. */
3484
3485if (local_scan_data != NULL)
3486 {
3487 int len = Ustrlen(local_scan_data);
3488 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3489 local_scan_data = string_copyn(local_scan_data, len);
3490 }
3491
3492if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3493 {
58eb016e 3494 if (!deliver_freeze) /* ACL might have already frozen */
059ec3d9
PH
3495 {
3496 deliver_freeze = TRUE;
3497 deliver_frozen_at = time(NULL);
3498 frozen_by = US"local_scan()";
3499 }
3500 rc = LOCAL_SCAN_ACCEPT;
3501 }
3502else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3503 {
3504 if (!queue_only_policy) /* ACL might have already queued */
3505 {
3506 queue_only_policy = TRUE;
3507 queued_by = US"local_scan()";
3508 }
3509 rc = LOCAL_SCAN_ACCEPT;
3510 }
3511
3512/* Message accepted: remove newlines in local_scan_data because otherwise
3513the spool file gets corrupted. Ensure that all recipients are qualified. */
3514
3515if (rc == LOCAL_SCAN_ACCEPT)
3516 {
3517 if (local_scan_data != NULL)
3518 {
3519 uschar *s;
3520 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3521 }
3522 for (i = 0; i < recipients_count; i++)
3523 {
3524 recipient_item *r = recipients_list + i;
3525 r->address = rewrite_address_qualify(r->address, TRUE);
3526 if (r->errors_to != NULL)
3527 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3528 }
3529 if (recipients_count == 0 && blackholed_by == NULL)
3530 blackholed_by = US"local_scan";
3531 }
3532
3533/* Message rejected: newlines permitted in local_scan_data to generate
3534multiline SMTP responses. */
3535
3536else
3537 {
3538 uschar *istemp = US"";
3539 uschar *s = NULL;
a5bd321b 3540 uschar *smtp_code;
059ec3d9
PH
3541 int size = 0;
3542 int sptr = 0;
059ec3d9
PH
3543
3544 errmsg = local_scan_data;
3545
3546 Uunlink(spool_name); /* Cancel this message */
3547 switch(rc)
3548 {
3549 default:
3550 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3551 "rejection given", rc);
3552 goto TEMPREJECT;
3553
3554 case LOCAL_SCAN_REJECT_NOLOGHDR:
3555 log_extra_selector &= ~LX_rejected_header;
3556 /* Fall through */
3557
3558 case LOCAL_SCAN_REJECT:
a5bd321b 3559 smtp_code = US"550";
059ec3d9
PH
3560 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3561 break;
3562
3563 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
3564 log_extra_selector &= ~LX_rejected_header;
3565 /* Fall through */
3566
3567 case LOCAL_SCAN_TEMPREJECT:
3568 TEMPREJECT:
a5bd321b 3569 smtp_code = US"451";
059ec3d9
PH
3570 if (errmsg == NULL) errmsg = US"Temporary local problem";
3571 istemp = US"temporarily ";
3572 break;
3573 }
3574
3575 s = string_append(s, &size, &sptr, 2, US"F=",
3576 (sender_address[0] == 0)? US"<>" : sender_address);
3577 s = add_host_info_for_log(s, &size, &sptr);
3578 s[sptr] = 0;
3579
3580 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3581 s, istemp, string_printing(errmsg));
3582
3583 if (smtp_input)
3584 {
3585 if (!smtp_batched_input)
3586 {
a5bd321b 3587 smtp_respond(smtp_code, 3, TRUE, errmsg);
059ec3d9
PH
3588 message_id[0] = 0; /* Indicate no message accepted */
3589 smtp_reply = US""; /* Indicate reply already sent */
3590 goto TIDYUP; /* Skip to end of function */
3591 }
3592 else
3593 {
a5bd321b 3594 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
059ec3d9
PH
3595 /* Does not return */
3596 }
3597 }
3598 else
3599 {
3600 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3601 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3602 US"message rejected by local scan code: ", error_rc, data_file,
3603 header_list);
3604 /* Does not return */
3605 }
3606 }
3607
3608/* Reset signal handlers to ignore signals that previously would have caused
3609the message to be abandoned. */
3610
3611signal(SIGTERM, SIG_IGN);
3612signal(SIGINT, SIG_IGN);
3613
e4bdf652 3614
059ec3d9
PH
3615/* Ensure the first time flag is set in the newly-received message. */
3616
3617deliver_firsttime = TRUE;
3618
8523533c
TK
3619#ifdef EXPERIMENTAL_BRIGHTMAIL
3620if (bmi_run == 1) {
3621 /* rewind data file */
3622 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3623 bmi_verdicts = bmi_process_message(header_list, data_fd);
3624};
3625#endif
3626
059ec3d9
PH
3627/* Update the timestamp in our Received: header to account for any time taken by
3628an ACL or by local_scan(). The new time is the time that all reception
3629processing is complete. */
3630
3631timestamp = expand_string(US"${tod_full}");
3632tslen = Ustrlen(timestamp);
3633
3634memcpy(received_header->text + received_header->slen - tslen - 1,
3635 timestamp, tslen);
3636
3637/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3638
3639if (mua_wrapper)
3640 {
3641 deliver_freeze = FALSE;
3642 queue_only_policy = FALSE;
3643 }
3644
3645/* Keep the data file open until we have written the header file, in order to
3646hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3647don't write the header file, and we unlink the data file. If writing the header
3648file fails, we have failed to accept this message. */
3649
3650if (host_checking || blackholed_by != NULL)
3651 {
3652 header_line *h;
3653 Uunlink(spool_name);
3654 msg_size = 0; /* Compute size for log line */
3655 for (h = header_list; h != NULL; h = h->next)
3656 if (h->type != '*') msg_size += h->slen;
3657 }
3658
3659/* Write the -H file */
3660
3661else
3662 {
3663 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3664 {
3665 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3666 Uunlink(spool_name); /* Lose the data file */
3667
3668 if (smtp_input)
3669 {
3670 smtp_reply = US"451 Error in writing spool file";
3671 message_id[0] = 0; /* Indicate no message accepted */
3672 goto TIDYUP;
3673 }
3674 else
3675 {
3676 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3677 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3678 header_list);
3679 /* Does not return */
3680 }
3681 }
3682 }
3683
3684
3685/* The message has now been successfully received. */
3686
3687receive_messagecount++;
3688
3689/* In SMTP sessions we may receive several in one connection. After each one,
3690we wait for the clock to tick at the level of message-id granularity. This is
3691so that the combination of time+pid is unique, even on systems where the pid
3692can be re-used within our time interval. We can't shorten the interval without
3693re-designing the message-id. See comments above where the message id is
3694created. This is Something For The Future. */
3695
3696message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3697exim_wait_tick(&message_id_tv, id_resolution);
3698
3699/* Add data size to written header size. We do not count the initial file name
3700that is in the file, but we do add one extra for the notional blank line that
3701precedes the data. This total differs from message_size in that it includes the
3702added Received: header and any other headers that got created locally. */
3703
3704fflush(data_file);
3705fstat(data_fd, &statbuf);
3706
3707msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3708
3709/* Generate a "message received" log entry. We do this by building up a dynamic
3710string as required. Since we commonly want to add two items at a time, use a
3711macro to simplify the coding. We log the arrival of a new message while the
3712file is still locked, just in case the machine is *really* fast, and delivers
3713it first! Include any message id that is in the message - since the syntax of a
3714message id is actually an addr-spec, we can use the parse routine to canonicize
3715it. */
3716
3717size = 256;
3718sptr = 0;
3719s = store_get(size);
3720
3721s = string_append(s, &size, &sptr, 2, US"<= ",
3722 (sender_address[0] == 0)? US"<>" : sender_address);
3723if (message_reference != NULL)
3724 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3725
3726s = add_host_info_for_log(s, &size, &sptr);
3727
3728#ifdef SUPPORT_TLS
817d9f57
JH
3729if ((log_extra_selector & LX_tls_cipher) != 0 && tls_in.cipher != NULL)
3730 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
059ec3d9 3731if ((log_extra_selector & LX_tls_certificate_verified) != 0 &&
817d9f57 3732 tls_in.cipher != NULL)
059ec3d9 3733 s = string_append(s, &size, &sptr, 2, US" CV=",
817d9f57
JH
3734 tls_in.certificate_verified? "yes":"no");
3735if ((log_extra_selector & LX_tls_peerdn) != 0 && tls_in.peerdn != NULL)
48ed62d9 3736 s = string_append(s, &size, &sptr, 3, US" DN=\"",
817d9f57
JH
3737 string_printing(tls_in.peerdn), US"\"");
3738if ((log_extra_selector & LX_tls_sni) != 0 && tls_in.sni != NULL)
3f0945ff 3739 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
817d9f57 3740 string_printing(tls_in.sni), US"\"");
3f0945ff 3741#endif
059ec3d9
PH
3742
3743if (sender_host_authenticated != NULL)
3744 {
3745 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
3746 if (authenticated_id != NULL)
c8e2fc1e 3747 {
059ec3d9 3748 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
c8e2fc1e
JH
3749 if (log_extra_selector & LX_smtp_mailauth && authenticated_sender != NULL)
3750 s = string_append(s, &size, &sptr, 2, US":", authenticated_sender);
3751 }
059ec3d9
PH
3752 }
3753
fd98a5c6
JH
3754#ifdef EXPERIMENTAL_PRDR
3755if (prdr_requested)
3756 s = string_append(s, &size, &sptr, 1, US" PRDR");
3757#endif
3758
059ec3d9
PH
3759sprintf(CS big_buffer, "%d", msg_size);
3760s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3761
3c0a92dc
JH
3762/* log 8BITMIME mode announced in MAIL_FROM
3763 0 ... no BODY= used
3764 7 ... 7BIT
3765 8 ... 8BITMIME */
c8e2fc1e
JH
3766if (log_extra_selector & LX_8bitmime)
3767 {
3c0a92dc
JH
3768 sprintf(CS big_buffer, "%d", body_8bitmime);
3769 s = string_append(s, &size, &sptr, 2, US" M8S=", big_buffer);
c8e2fc1e 3770 }
3c0a92dc 3771
059ec3d9
PH
3772/* If an addr-spec in a message-id contains a quoted string, it can contain
3773any characters except " \ and CR and so in particular it can contain NL!
3774Therefore, make sure we use a printing-characters only version for the log.
3775Also, allow for domain literals in the message id. */
3776
3777if (msgid_header != NULL)
3778 {
3779 uschar *old_id;
3780 BOOL save_allow_domain_literals = allow_domain_literals;
3781 allow_domain_literals = TRUE;
3782 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3783 &errmsg, &start, &end, &domain, FALSE);
3784 allow_domain_literals = save_allow_domain_literals;
3785 if (old_id != NULL)
3786 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3787 }
3788
3789/* If subject logging is turned on, create suitable printing-character
3790text. By expanding $h_subject: we make use of the MIME decoding. */
3791
3792if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL)
3793 {
3794 int i;
3795 uschar *p = big_buffer;
3796 uschar *ss = expand_string(US"$h_subject:");
3797
3798 /* Backslash-quote any double quotes or backslashes so as to make a
3799 C-like string, and turn any non-printers into escape sequences. */
3800
3801 *p++ = '\"';
3802 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3803 {
3804 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3805 *p++ = ss[i];
3806 }
3807 *p++ = '\"';
3808 *p = 0;
3809 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3810 }
3811
3812/* Terminate the string: string_cat() and string_append() leave room, but do
3813not put the zero in. */
3814
3815s[sptr] = 0;
3816
059ec3d9
PH
3817/* Create a message log file if message logs are being used and this message is
3818not blackholed. Write the reception stuff to it. We used to leave message log
e4bdf652 3819creation until the first delivery, but this has proved confusing for some
059ec3d9
PH
3820people. */
3821
3822if (message_logs && blackholed_by == NULL)
3823 {
3824 int fd;
3825
3826 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir,
3827 message_id);
3828 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3829
3830 if (fd < 0 && errno == ENOENT)
3831 {
3832 uschar temp[16];
3833 sprintf(CS temp, "msglog/%s", message_subdir);
3834 if (message_subdir[0] == 0) temp[6] = 0;
3835 (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE);
3836 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3837 }
3838
3839 if (fd < 0)
3840 {
3841 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3842 spool_name, strerror(errno));
3843 }
3844
3845 else
3846 {
3847 FILE *message_log = fdopen(fd, "a");
3848 if (message_log == NULL)
3849 {
3850 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3851 spool_name, strerror(errno));
f1e894f3 3852 (void)close(fd);
059ec3d9
PH
3853 }
3854 else
3855 {
3856 uschar *now = tod_stamp(tod_log);
3857 fprintf(message_log, "%s Received from %s\n", now, s+3);
3858 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3859 frozen_by);
3860 if (queue_only_policy) fprintf(message_log,
3861 "%s no immediate delivery: queued by %s\n", now, queued_by);
f1e894f3 3862 (void)fclose(message_log);
059ec3d9
PH
3863 }
3864 }
3865 }
3866
58eb016e
PH
3867/* Everything has now been done for a successful message except logging its
3868arrival, and outputting an SMTP response. While writing to the log, set a flag
3869to cause a call to receive_bomb_out() if the log cannot be opened. */
3870
3871receive_call_bombout = TRUE;
3872
563b63fa
PH
3873/* Before sending an SMTP response in a TCP/IP session, we check to see if the
3874connection has gone away. This can only be done if there is no unconsumed input
3875waiting in the local input buffer. We can test for this by calling
3876receive_smtp_buffered(). RFC 2920 (pipelining) explicitly allows for additional
3877input to be sent following the final dot, so the presence of following input is
3878not an error.
58eb016e 3879
563b63fa
PH
3880If the connection is still present, but there is no unread input for the
3881socket, the result of a select() call will be zero. If, however, the connection
3882has gone away, or if there is pending input, the result of select() will be
3883non-zero. The two cases can be distinguished by trying to read the next input
3884character. If we succeed, we can unread it so that it remains in the local
3885buffer for handling later. If not, the connection has been lost.
58eb016e 3886
563b63fa
PH
3887Of course, since TCP/IP is asynchronous, there is always a chance that the
3888connection will vanish between the time of this test and the sending of the
3889response, but the chance of this happening should be small. */
3890
3891if (smtp_input && sender_host_address != NULL && !sender_host_notsocket &&
3892 !receive_smtp_buffered())
58eb016e
PH
3893 {
3894 struct timeval tv;
3895 fd_set select_check;
3896 FD_ZERO(&select_check);
3897 FD_SET(fileno(smtp_in), &select_check);
3898 tv.tv_sec = 0;
3899 tv.tv_usec = 0;
3900
563b63fa 3901 if (select(fileno(smtp_in) + 1, &select_check, NULL, NULL, &tv) != 0)
58eb016e 3902 {
80a47a2c
TK
3903 int c = (receive_getc)();
3904 if (c != EOF) (receive_ungetc)(c); else
58eb016e 3905 {
563b63fa
PH
3906 uschar *msg = US"SMTP connection lost after final dot";
3907 smtp_reply = US""; /* No attempt to send a response */
3908 smtp_yield = FALSE; /* Nothing more on this connection */
58eb016e 3909
563b63fa 3910 /* Re-use the log line workspace */
58eb016e 3911
563b63fa
PH
3912 sptr = 0;
3913 s = string_cat(s, &size, &sptr, msg, Ustrlen(msg));
3914 s = add_host_info_for_log(s, &size, &sptr);
3915 s[sptr] = 0;
3916 log_write(0, LOG_MAIN, "%s", s);
58eb016e 3917
563b63fa 3918 /* Delete the files for this aborted message. */
58eb016e 3919
563b63fa
PH
3920 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
3921 message_subdir, message_id);
3922 Uunlink(spool_name);
58eb016e 3923
563b63fa
PH
3924 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
3925 message_subdir, message_id);
3926 Uunlink(spool_name);
58eb016e 3927
563b63fa
PH
3928 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
3929 message_subdir, message_id);
3930 Uunlink(spool_name);
58eb016e 3931
563b63fa
PH
3932 goto TIDYUP;
3933 }
58eb016e
PH
3934 }
3935 }
3936
3937/* The connection has not gone away; we really are going to take responsibility
3938for this message. */
3939
817d9f57 3940/* Cutthrough - had sender last-dot; assume we've sent (or buffered) all
e4bdf652
JH
3941 data onward by now.
3942
817d9f57 3943 Send dot onward. If accepted, wipe the spooled files, log as delivered and accept
e4bdf652 3944 the sender's dot (below).
817d9f57
JH
3945 If rejected: copy response to sender, wipe the spooled files, log appropriately.
3946 If temp-reject: accept to sender, keep the spooled files.
e4bdf652
JH
3947
3948 Having the normal spool files lets us do data-filtering, and store/forward on temp-reject.
817d9f57
JH
3949
3950 XXX We do not handle queue-only, freezing, or blackholes.
e4bdf652 3951*/
6d9cfc47 3952cutthrough_done = 0;
e4bdf652
JH
3953if(cutthrough_fd >= 0)
3954 {
3955 uschar * msg= cutthrough_finaldot(); /* Ask the target system to accept the messsage */
817d9f57 3956 /* Logging was done in finaldot() */
e4bdf652 3957 switch(msg[0])
817d9f57
JH
3958 {
3959 case '2': /* Accept. Do the same to the source; dump any spoolfiles. */
3960 cutthrough_done = 3;
3961 break; /* message_id needed for SMTP accept below */
61147df4 3962
817d9f57
JH
3963 default: /* Unknown response, or error. Treat as temp-reject. */
3964 case '4': /* Temp-reject. Keep spoolfiles and accept. */
3965 cutthrough_done = 1; /* Avoid the usual immediate delivery attempt */
3966 break; /* message_id needed for SMTP accept below */
61147df4 3967
817d9f57
JH
3968 case '5': /* Perm-reject. Do the same to the source. Dump any spoolfiles */
3969 smtp_reply= msg; /* Pass on the exact error */
3970 cutthrough_done = 2;
3971 break;
3972 }
e4bdf652 3973 }
58eb016e 3974
fd98a5c6
JH
3975if(smtp_reply == NULL
3976#ifdef EXPERIMENTAL_PRDR
3977 || prdr_requested
3978#endif
3979 )
e4bdf652
JH
3980 {
3981 log_write(0, LOG_MAIN |
3982 (((log_extra_selector & LX_received_recipients) != 0)? LOG_RECIPIENTS : 0) |
3983 (((log_extra_selector & LX_received_sender) != 0)? LOG_SENDER : 0),
3984 "%s", s);
3985
3986 /* Log any control actions taken by an ACL or local_scan(). */
58eb016e 3987
e4bdf652
JH
3988 if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
3989 if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
3990 "no immediate delivery: queued by %s", queued_by);
3991 }
3992receive_call_bombout = FALSE;
58eb016e 3993
059ec3d9
PH
3994store_reset(s); /* The store for the main log message can be reused */
3995
3996/* If the message is frozen, and freeze_tell is set, do the telling. */
3997
3998if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
3999 {
4000 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
4001 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
4002 message_id, frozen_by, sender_address);
4003 }
4004
4005
4006/* Either a message has been successfully received and written to the two spool
4007files, or an error in writing the spool has occurred for an SMTP message, or
58eb016e
PH
4008an SMTP message has been rejected for policy reasons. (For a non-SMTP message
4009we will have already given up because there's no point in carrying on!) In
4010either event, we must now close (and thereby unlock) the data file. In the
059ec3d9
PH
4011successful case, this leaves the message on the spool, ready for delivery. In
4012the error case, the spool file will be deleted. Then tidy up store, interact
4013with an SMTP call if necessary, and return.
4014
4015A fflush() was done earlier in the expectation that any write errors on the
4016data file will be flushed(!) out thereby. Nevertheless, it is theoretically
4017possible for fclose() to fail - but what to do? What has happened to the lock
4018if this happens? */
4019
e4bdf652 4020
059ec3d9 4021TIDYUP:
f1e894f3
PH
4022process_info[process_info_len] = 0; /* Remove message id */
4023if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
059ec3d9
PH
4024
4025/* Now reset signal handlers to their defaults */
4026
4027signal(SIGTERM, SIG_DFL);
4028signal(SIGINT, SIG_DFL);
4029
4030/* Tell an SMTP caller the state of play, and arrange to return the SMTP return
4031value, which defaults TRUE - meaning there may be more incoming messages from
4032this connection. For non-SMTP callers (where there is only ever one message),
4033the default is FALSE. */
4034
4035if (smtp_input)
4036 {
4037 yield = smtp_yield;
4038
4039 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
58eb016e
PH
4040 is set to the response that should be sent. When it is NULL, we generate
4041 default responses. After an ACL error or local_scan() error, the response has
4042 already been sent, and smtp_reply is an empty string to indicate this. */
059ec3d9
PH
4043
4044 if (!smtp_batched_input)
4045 {
4046 if (smtp_reply == NULL)
4047 {
29aba418 4048 if (fake_response != OK)
a5bd321b
PH
4049 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4050 fake_response_text);
4e88a19f
PH
4051
4052 /* An OK response is required; use "message" text if present. */
4053
4054 else if (user_msg != NULL)
4055 {
4056 uschar *code = US"250";
4057 int len = 3;
4058 smtp_message_code(&code, &len, &user_msg, NULL);
4059 smtp_respond(code, len, TRUE, user_msg);
4060 }
4061
4062 /* Default OK response */
4063
8e669ac1
PH
4064 else
4065 smtp_printf("250 OK id=%s\r\n", message_id);
059ec3d9
PH
4066 if (host_checking)
4067 fprintf(stdout,
4068 "\n**** SMTP testing: that is not a real message id!\n\n");
4069 }
4e88a19f 4070
58eb016e 4071 /* smtp_reply is set non-empty */
4e88a19f 4072
8523533c
TK
4073 else if (smtp_reply[0] != 0)
4074 {
29aba418 4075 if (fake_response != OK && (smtp_reply[0] == '2'))
a5bd321b
PH
4076 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4077 fake_response_text);
8e669ac1 4078 else
6951ac6c
PH
4079 smtp_printf("%.1024s\r\n", smtp_reply);
4080 }
e4bdf652 4081
817d9f57
JH
4082 switch (cutthrough_done)
4083 {
4084 case 3: log_write(0, LOG_MAIN, "Completed"); /* Delivery was done */
4085 case 2: { /* Delete spool files */
4086 sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory,
4087 message_subdir, message_id);
4088 Uunlink(spool_name);
4089 sprintf(CS spool_name, "%s/input/%s/%s-H", spool_directory,
4090 message_subdir, message_id);
4091 Uunlink(spool_name);
4092 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory,
4093 message_subdir, message_id);
4094 Uunlink(spool_name);
4095 }
4096 case 1: message_id[0] = 0; /* Prevent a delivery from starting */
4097 default:break;
e4bdf652 4098 }
817d9f57 4099 cutthrough_delivery = FALSE;
059ec3d9
PH
4100 }
4101
4102 /* For batched SMTP, generate an error message on failure, and do
4103 nothing on success. The function moan_smtp_batch() does not return -
4104 it exits from the program with a non-zero return code. */
4105
4106 else if (smtp_reply != NULL) moan_smtp_batch(NULL, "%s", smtp_reply);
4107 }
4108
4109
4110/* If blackholing, we can immediately log this message's sad fate. The data
4111file has already been unlinked, and the header file was never written to disk.
4112We must now indicate that nothing was received, to prevent a delivery from
4113starting. */
4114
4115if (blackholed_by != NULL)
4116 {
4117 uschar *detail = (local_scan_data != NULL)?
4118 string_printing(local_scan_data) :
4119 string_sprintf("(%s discarded recipients)", blackholed_by);
04f7d5b9 4120 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
059ec3d9
PH
4121 log_write(0, LOG_MAIN, "Completed");
4122 message_id[0] = 0;
4123 }
4124
4125/* Reset headers so that logging of rejects for a subsequent message doesn't
4126include them. It is also important to set header_last = NULL before exiting
4127from this function, as this prevents certain rewrites that might happen during
4128subsequent verifying (of another incoming message) from trying to add headers
4129when they shouldn't. */
4130
4131header_list = header_last = NULL;
4132
4133return yield; /* TRUE if more messages (SMTP only) */
4134}
4135
4136/* End of receive.c */