Handle recursion better, caused by ACLs.
[exim.git] / src / src / receive.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
c4ceed07 5/* Copyright (c) University of Cambridge 1995 - 2012 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Code for receiving a message and setting up spool files. */
9
059ec3d9
PH
10#include "exim.h"
11
6a8f9482
TK
12#ifdef EXPERIMENTAL_DCC
13extern int dcc_ok;
14#endif
15
059ec3d9
PH
16/*************************************************
17* Local static variables *
18*************************************************/
19
20static FILE *data_file = NULL;
21static int data_fd = -1;
22static uschar spool_name[256];
23
24
25
26/*************************************************
27* Non-SMTP character reading functions *
28*************************************************/
29
30/* These are the default functions that are set up in the variables such as
31receive_getc initially. They just call the standard functions, passing stdin as
32the file. (When SMTP input is occurring, different functions are used by
33changing the pointer variables.) */
34
35int
36stdin_getc(void)
37{
38return getc(stdin);
39}
40
41int
42stdin_ungetc(int c)
43{
44return ungetc(c, stdin);
45}
46
47int
48stdin_feof(void)
49{
50return feof(stdin);
51}
52
53int
54stdin_ferror(void)
55{
56return ferror(stdin);
57}
58
59
60
61
62/*************************************************
63* Check that a set sender is allowed *
64*************************************************/
65
66/* This function is called when a local caller sets an explicit sender address.
67It checks whether this is permitted, which it is for trusted callers.
68Otherwise, it must match the pattern(s) in untrusted_set_sender.
69
70Arguments: the proposed sender address
71Returns: TRUE for a trusted caller
72 TRUE if the address has been set, untrusted_set_sender has been
73 set, and the address matches something in the list
74 FALSE otherwise
75*/
76
77BOOL
78receive_check_set_sender(uschar *newsender)
79{
80uschar *qnewsender;
81if (trusted_caller) return TRUE;
82if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
83qnewsender = (Ustrchr(newsender, '@') != NULL)?
84 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
85return
86 match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1,
87 0, NULL) == OK;
88}
89
90
91
92
93/*************************************************
5cb8cbc6 94* Read space info for a partition *
059ec3d9
PH
95*************************************************/
96
8e669ac1
PH
97/* This function is called by receive_check_fs() below, and also by string
98expansion for variables such as $spool_space. The field names for the statvfs
5cb8cbc6
PH
99structure are macros, because not all OS have F_FAVAIL and it seems tidier to
100have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
101have inodes, and they return -1 for the number available.
059ec3d9 102
5cb8cbc6
PH
103Later: It turns out that some file systems that do not have the concept of
104inodes return 0 rather than -1. Such systems should also return 0 for the total
8e669ac1 105number of inodes, so we require that to be greater than zero before returning
5cb8cbc6 106an inode count.
059ec3d9 107
5cb8cbc6
PH
108Arguments:
109 isspool TRUE for spool partition, FALSE for log partition
110 inodeptr address of int to receive inode count; -1 if there isn't one
8e669ac1 111
5cb8cbc6 112Returns: available on-root space, in kilobytes
8e669ac1
PH
113 -1 for log partition if there isn't one
114
115All values are -1 if the STATFS functions are not available.
059ec3d9
PH
116*/
117
8e669ac1 118int
5cb8cbc6 119receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
120{
121#ifdef HAVE_STATFS
059ec3d9 122struct STATVFS statbuf;
5cb8cbc6
PH
123uschar *path;
124uschar *name;
125uschar buffer[1024];
059ec3d9 126
5cb8cbc6 127/* The spool directory must always exist. */
059ec3d9 128
5cb8cbc6 129if (isspool)
059ec3d9 130 {
8e669ac1
PH
131 path = spool_directory;
132 name = US"spool";
133 }
134
059ec3d9
PH
135/* Need to cut down the log file path to the directory, and to ignore any
136appearance of "syslog" in it. */
137
5cb8cbc6 138else
059ec3d9 139 {
059ec3d9 140 int sep = ':'; /* Not variable - outside scripts use */
059ec3d9 141 uschar *p = log_file_path;
8e669ac1 142 name = US"log";
059ec3d9
PH
143
144 /* An empty log_file_path means "use the default". This is the same as an
145 empty item in a list. */
146
147 if (*p == 0) p = US":";
148 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL)
149 {
150 if (Ustrcmp(path, "syslog") != 0) break;
151 }
152
5cb8cbc6
PH
153 if (path == NULL) /* No log files */
154 {
8e669ac1
PH
155 *inodeptr = -1;
156 return -1;
157 }
059ec3d9 158
8e669ac1
PH
159 /* An empty string means use the default, which is in the spool directory.
160 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 161 subdirectory has been symbolically linked elsewhere. */
059ec3d9 162
8e669ac1 163 if (path[0] == 0)
059ec3d9 164 {
5cb8cbc6
PH
165 sprintf(CS buffer, CS"%s/log", CS spool_directory);
166 path = buffer;
8e669ac1
PH
167 }
168 else
059ec3d9 169 {
8e669ac1 170 uschar *cp;
5cb8cbc6 171 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 172 }
5cb8cbc6 173 }
8e669ac1 174
8f128379 175/* We now have the path; do the business */
5cb8cbc6
PH
176
177memset(&statbuf, 0, sizeof(statbuf));
178
179if (STATVFS(CS path, &statbuf) != 0)
180 {
181 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
182 "%s directory %s: %s", name, spool_directory, strerror(errno));
183 smtp_closedown(US"spool or log directory problem");
184 exim_exit(EXIT_FAILURE);
185 }
8e669ac1 186
5cb8cbc6
PH
187*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
188
189/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 190
5cb8cbc6
PH
191return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
192
193/* Unable to find partition sizes in this environment. */
194
195#else
196*inodeptr = -1;
197return -1;
198#endif
199}
200
059ec3d9 201
059ec3d9 202
5cb8cbc6
PH
203
204/*************************************************
205* Check space on spool and log partitions *
206*************************************************/
207
208/* This function is called before accepting a message; if any thresholds are
209set, it checks them. If a message_size is supplied, it checks that there is
210enough space for that size plus the threshold - i.e. that the message won't
211reduce the space to the threshold. Not all OS have statvfs(); for those that
212don't, this function always returns TRUE. For some OS the old function and
213struct name statfs is used; that is handled by a macro, defined in exim.h.
214
215Arguments:
216 msg_size the (estimated) size of an incoming message
217
218Returns: FALSE if there isn't enough space, or if the information cannot
219 be obtained
220 TRUE if no check was done or there is enough space
221*/
222
223BOOL
224receive_check_fs(int msg_size)
225{
226int space, inodes;
227
228if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
229 {
8e669ac1
PH
230 space = receive_statvfs(TRUE, &inodes);
231
059ec3d9 232 DEBUG(D_receive)
5cb8cbc6
PH
233 debug_printf("spool directory space = %dK inodes = %d "
234 "check_space = %dK inodes = %d msg_size = %d\n",
235 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
236
237 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 238 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 239 {
5cb8cbc6
PH
240 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
241 "inodes=%d", space, inodes);
059ec3d9
PH
242 return FALSE;
243 }
244 }
245
5cb8cbc6
PH
246if (check_log_space > 0 || check_log_inodes > 0)
247 {
8e669ac1
PH
248 space = receive_statvfs(FALSE, &inodes);
249
5cb8cbc6
PH
250 DEBUG(D_receive)
251 debug_printf("log directory space = %dK inodes = %d "
252 "check_space = %dK inodes = %d\n",
253 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
254
255 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 256 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 257 {
5cb8cbc6
PH
258 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
259 "inodes=%d", space, inodes);
260 return FALSE;
261 }
8e669ac1
PH
262 }
263
059ec3d9
PH
264return TRUE;
265}
266
267
268
269/*************************************************
270* Bomb out while reading a message *
271*************************************************/
272
273/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
274received, or if there is a timeout. A rarer case might be if the log files are
275screwed up and Exim can't open them to record a message's arrival. Handling
276that case is done by setting a flag to cause the log functions to call this
277function if there is an ultimate disaster. That is why it is globally
278accessible.
279
8f128379
PH
280Arguments:
281 reason text reason to pass to the not-quit ACL
282 msg default SMTP response to give if in an SMTP session
059ec3d9
PH
283Returns: it doesn't
284*/
285
286void
8f128379 287receive_bomb_out(uschar *reason, uschar *msg)
059ec3d9 288{
ead37e6c
PP
289 static BOOL already_bombing_out;
290/* The smtp_notquit_exit() below can call ACLs which can trigger recursive
291timeouts, if someone has something slow in their quit ACL. Since the only
292things we should be doing are to close down cleanly ASAP, on the second
293pass we also close down stuff that might be opened again, before bypassing
294the ACL call and exiting. */
295
059ec3d9
PH
296/* If spool_name is set, it contains the name of the data file that is being
297written. Unlink it before closing so that it cannot be picked up by a delivery
298process. Ensure that any header file is also removed. */
299
ead37e6c 300if (spool_name[0] != '\0')
059ec3d9
PH
301 {
302 Uunlink(spool_name);
303 spool_name[Ustrlen(spool_name) - 1] = 'H';
304 Uunlink(spool_name);
ead37e6c 305 spool_name[0] = '\0';
059ec3d9
PH
306 }
307
308/* Now close the file if it is open, either as a fd or a stream. */
309
ead37e6c
PP
310if (data_file != NULL)
311 {
312 (void)fclose(data_file);
313 data_file = NULL;
314} else if (data_fd >= 0) {
315 (void)close(data_fd);
316 data_fd = -1;
317 }
059ec3d9 318
8f128379
PH
319/* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
320smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
321SMTP response. */
059ec3d9 322
ead37e6c 323if (!already_bombing_out)
059ec3d9 324 {
ead37e6c
PP
325 already_bombing_out = TRUE;
326 if (smtp_input)
327 {
328 if (smtp_batched_input)
329 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
330 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
331 smtp_active_hostname, msg);
332 }
059ec3d9
PH
333 }
334
335/* Exit from the program (non-BSMTP cases) */
336
337exim_exit(EXIT_FAILURE);
338}
339
340
341/*************************************************
342* Data read timeout *
343*************************************************/
344
345/* Handler function for timeouts that occur while reading the data that
346comprises a message.
347
348Argument: the signal number
349Returns: nothing
350*/
351
352static void
353data_timeout_handler(int sig)
354{
355uschar *msg = NULL;
356
357sig = sig; /* Keep picky compilers happy */
358
359if (smtp_input)
360 {
361 msg = US"SMTP incoming data timeout";
362 log_write(L_lost_incoming_connection,
363 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
364 "from %s F=<%s>",
365 (sender_fullhost != NULL)? sender_fullhost : US"local process",
366 sender_address);
059ec3d9
PH
367 }
368else
369 {
370 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
371 log_write(L_lost_incoming_connection,
372 LOG_MAIN, "timed out while reading local message");
373 }
374
8f128379 375receive_bomb_out(US"data-timeout", msg); /* Does not return */
059ec3d9
PH
376}
377
378
379
380/*************************************************
381* local_scan() timeout *
382*************************************************/
383
384/* Handler function for timeouts that occur while running a local_scan()
385function.
386
387Argument: the signal number
388Returns: nothing
389*/
390
391static void
392local_scan_timeout_handler(int sig)
393{
394sig = sig; /* Keep picky compilers happy */
395log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
396 "message temporarily rejected (size %d)", message_size);
8f128379
PH
397/* Does not return */
398receive_bomb_out(US"local-scan-timeout", US"local verification problem");
059ec3d9
PH
399}
400
401
402
403/*************************************************
404* local_scan() crashed *
405*************************************************/
406
407/* Handler function for signals that occur while running a local_scan()
408function.
409
410Argument: the signal number
411Returns: nothing
412*/
413
414static void
415local_scan_crash_handler(int sig)
416{
417log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
418 "signal %d - message temporarily rejected (size %d)", sig, message_size);
8f128379
PH
419/* Does not return */
420receive_bomb_out(US"local-scan-error", US"local verification problem");
059ec3d9
PH
421}
422
423
424/*************************************************
425* SIGTERM or SIGINT received *
426*************************************************/
427
428/* Handler for SIGTERM or SIGINT signals that occur while reading the
429data that comprises a message.
430
431Argument: the signal number
432Returns: nothing
433*/
434
435static void
436data_sigterm_sigint_handler(int sig)
437{
438uschar *msg = NULL;
439
440if (smtp_input)
441 {
442 msg = US"Service not available - SIGTERM or SIGINT received";
443 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
444 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
445 }
446else
447 {
f05da2e8 448 if (filter_test == FTEST_NONE)
059ec3d9
PH
449 {
450 fprintf(stderr, "\nexim: %s received - message abandoned\n",
451 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
452 log_write(0, LOG_MAIN, "%s received while reading local message",
453 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
454 }
455 }
456
8f128379 457receive_bomb_out(US"signal-exit", msg); /* Does not return */
059ec3d9
PH
458}
459
460
461
462/*************************************************
463* Add new recipient to list *
464*************************************************/
465
466/* This function builds a list of recipient addresses in argc/argv
467format.
468
469Arguments:
470 recipient the next address to add to recipients_list
471 pno parent number for fixed aliases; -1 otherwise
472
473Returns: nothing
474*/
475
476void
477receive_add_recipient(uschar *recipient, int pno)
478{
479if (recipients_count >= recipients_list_max)
480 {
481 recipient_item *oldlist = recipients_list;
482 int oldmax = recipients_list_max;
483 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
484 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
485 if (oldlist != NULL)
486 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
487 }
488
489recipients_list[recipients_count].address = recipient;
490recipients_list[recipients_count].pno = pno;
8523533c
TK
491#ifdef EXPERIMENTAL_BRIGHTMAIL
492recipients_list[recipients_count].bmi_optin = bmi_current_optin;
493/* reset optin string pointer for next recipient */
494bmi_current_optin = NULL;
495#endif
059ec3d9
PH
496recipients_list[recipients_count++].errors_to = NULL;
497}
498
499
500
501
502/*************************************************
fd98a5c6
JH
503* Send user response message *
504*************************************************/
505
506/* This function is passed a default response code and a user message. It calls
507smtp_message_code() to check and possibly modify the response code, and then
508calls smtp_respond() to transmit the response. I put this into a function
509just to avoid a lot of repetition.
510
511Arguments:
512 code the response code
513 user_msg the user message
514
515Returns: nothing
516*/
517
518static void
519smtp_user_msg(uschar *code, uschar *user_msg)
520{
521int len = 3;
522smtp_message_code(&code, &len, &user_msg, NULL);
523smtp_respond(code, len, TRUE, user_msg);
524}
525
526
527
528
529
530/*************************************************
059ec3d9
PH
531* Remove a recipient from the list *
532*************************************************/
533
534/* This function is provided for local_scan() to use.
535
536Argument:
537 recipient address to remove
538
539Returns: TRUE if it did remove something; FALSE otherwise
540*/
541
542BOOL
543receive_remove_recipient(uschar *recipient)
544{
545int count;
546DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
547 recipient);
548for (count = 0; count < recipients_count; count++)
549 {
550 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
551 {
552 if ((--recipients_count - count) > 0)
553 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 554 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
555 return TRUE;
556 }
557 }
558return FALSE;
559}
560
561
562
563
564
565/*************************************************
566* Read data portion of a non-SMTP message *
567*************************************************/
568
569/* This function is called to read the remainder of a message (following the
570header) when the input is not from SMTP - we are receiving a local message on
571a standard input stream. The message is always terminated by EOF, and is also
572terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
573two cases for maximum efficiency.
574
575Ensure that the body ends with a newline. This will naturally be the case when
576the termination is "\n.\n" but may not be otherwise. The RFC defines messages
577as "sequences of lines" - this of course strictly applies only to SMTP, but
578deliveries into BSD-type mailbox files also require it. Exim used to have a
579flag for doing this at delivery time, but as it was always set for all
580transports, I decided to simplify things by putting the check here instead.
581
582There is at least one MUA (dtmail) that sends CRLF via this interface, and
583other programs are known to do this as well. Exim used to have a option for
584dealing with this: in July 2003, after much discussion, the code has been
585changed to default to treat any of LF, CRLF, and bare CR as line terminators.
586
587However, for the case when a dot on a line by itself terminates a message, the
588only recognized terminating sequences before and after the dot are LF and CRLF.
589Otherwise, having read EOL . CR, you don't know whether to read another
590character or not.
591
592Internally, in messages stored in Exim's spool files, LF is used as the line
593terminator. Under the new regime, bare CRs will no longer appear in these
594files.
595
596Arguments:
597 fout a FILE to which to write the message
598
599Returns: One of the END_xxx values indicating why it stopped reading
600*/
601
602static int
603read_message_data(FILE *fout)
604{
605int ch_state;
606register int ch;
d677b2f2 607register int linelength = 0;
059ec3d9
PH
608
609/* Handle the case when only EOF terminates the message */
610
611if (!dot_ends)
612 {
613 register int last_ch = '\n';
614
80a47a2c 615 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
059ec3d9
PH
616 {
617 if (ch == 0) body_zerocount++;
618 if (last_ch == '\r' && ch != '\n')
619 {
d677b2f2
PH
620 if (linelength > max_received_linelength)
621 max_received_linelength = linelength;
622 linelength = 0;
059ec3d9
PH
623 if (fputc('\n', fout) == EOF) return END_WERROR;
624 message_size++;
625 body_linecount++;
626 }
627 if (ch == '\r') continue;
628
629 if (fputc(ch, fout) == EOF) return END_WERROR;
d677b2f2
PH
630 if (ch == '\n')
631 {
632 if (linelength > max_received_linelength)
633 max_received_linelength = linelength;
634 linelength = 0;
635 body_linecount++;
636 }
637 else linelength++;
059ec3d9
PH
638 if (++message_size > thismessage_size_limit) return END_SIZE;
639 }
640
641 if (last_ch != '\n')
642 {
d677b2f2
PH
643 if (linelength > max_received_linelength)
644 max_received_linelength = linelength;
059ec3d9
PH
645 if (fputc('\n', fout) == EOF) return END_WERROR;
646 message_size++;
647 body_linecount++;
648 }
649
650 return END_EOF;
651 }
652
653/* Handle the case when a dot on a line on its own, or EOF, terminates. */
654
655ch_state = 1;
656
80a47a2c 657while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
658 {
659 if (ch == 0) body_zerocount++;
660 switch (ch_state)
661 {
662 case 0: /* Normal state (previous char written) */
663 if (ch == '\n')
d677b2f2
PH
664 {
665 body_linecount++;
666 if (linelength > max_received_linelength)
667 max_received_linelength = linelength;
668 linelength = -1;
669 ch_state = 1;
670 }
059ec3d9
PH
671 else if (ch == '\r')
672 { ch_state = 2; continue; }
673 break;
674
675 case 1: /* After written "\n" */
676 if (ch == '.') { ch_state = 3; continue; }
d677b2f2 677 if (ch != '\n') ch_state = 0; else linelength = -1;
059ec3d9
PH
678 break;
679
680 case 2:
681 body_linecount++; /* After unwritten "\r" */
d677b2f2
PH
682 if (linelength > max_received_linelength)
683 max_received_linelength = linelength;
059ec3d9 684 if (ch == '\n')
d677b2f2
PH
685 {
686 ch_state = 1;
687 linelength = -1;
688 }
059ec3d9
PH
689 else
690 {
691 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
692 if (ch == '\r') continue;
693 ch_state = 0;
d677b2f2 694 linelength = 0;
059ec3d9
PH
695 }
696 break;
697
698 case 3: /* After "\n." (\n written, dot not) */
699 if (ch == '\n') return END_DOT;
700 if (ch == '\r') { ch_state = 4; continue; }
701 message_size++;
d677b2f2 702 linelength++;
059ec3d9
PH
703 if (fputc('.', fout) == EOF) return END_WERROR;
704 ch_state = 0;
705 break;
706
707 case 4: /* After "\n.\r" (\n written, rest not) */
708 if (ch == '\n') return END_DOT;
709 message_size += 2;
710 body_linecount++;
711 if (fputs(".\n", fout) == EOF) return END_WERROR;
712 if (ch == '\r') { ch_state = 2; continue; }
713 ch_state = 0;
714 break;
715 }
716
d677b2f2 717 linelength++;
059ec3d9
PH
718 if (fputc(ch, fout) == EOF) return END_WERROR;
719 if (++message_size > thismessage_size_limit) return END_SIZE;
720 }
721
722/* Get here if EOF read. Unless we have just written "\n", we need to ensure
723the message ends with a newline, and we must also write any characters that
724were saved up while testing for an ending dot. */
725
726if (ch_state != 1)
727 {
728 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
729 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
730 message_size += Ustrlen(ends[ch_state]);
731 body_linecount++;
732 }
733
734return END_EOF;
735}
736
737
738
739
740/*************************************************
741* Read data portion of an SMTP message *
742*************************************************/
743
744/* This function is called to read the remainder of an SMTP message (after the
745headers), or to skip over it when an error has occurred. In this case, the
746output file is passed as NULL.
747
748If any line begins with a dot, that character is skipped. The input should only
749be successfully terminated by CR LF . CR LF unless it is local (non-network)
750SMTP, in which case the CRs are optional, but...
751
752FUDGE: It seems that sites on the net send out messages with just LF
753terminators, despite the warnings in the RFCs, and other MTAs handle this. So
754we make the CRs optional in all cases.
755
756July 2003: Bare CRs cause trouble. We now treat them as line terminators as
757well, so that there are no CRs in spooled messages. However, the message
758terminating dot is not recognized between two bare CRs.
759
760Arguments:
761 fout a FILE to which to write the message; NULL if skipping
762
763Returns: One of the END_xxx values indicating why it stopped reading
764*/
765
766static int
767read_message_data_smtp(FILE *fout)
768{
769int ch_state = 0;
e4bdf652 770int ch;
1f5497b2 771register int linelength = 0;
059ec3d9 772
80a47a2c 773while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
774 {
775 if (ch == 0) body_zerocount++;
776 switch (ch_state)
777 {
778 case 0: /* After LF or CRLF */
779 if (ch == '.')
780 {
781 ch_state = 3;
782 continue; /* Don't ever write . after LF */
783 }
784 ch_state = 1;
785
786 /* Else fall through to handle as normal uschar. */
787
788 case 1: /* Normal state */
789 if (ch == '\n')
790 {
791 ch_state = 0;
792 body_linecount++;
1f5497b2
PH
793 if (linelength > max_received_linelength)
794 max_received_linelength = linelength;
795 linelength = -1;
059ec3d9
PH
796 }
797 else if (ch == '\r')
798 {
799 ch_state = 2;
800 continue;
801 }
802 break;
803
804 case 2: /* After (unwritten) CR */
805 body_linecount++;
1f5497b2
PH
806 if (linelength > max_received_linelength)
807 max_received_linelength = linelength;
808 linelength = -1;
059ec3d9
PH
809 if (ch == '\n')
810 {
811 ch_state = 0;
812 }
813 else
814 {
815 message_size++;
816 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 817 (void) cutthrough_put_nl();
059ec3d9
PH
818 if (ch != '\r') ch_state = 1; else continue;
819 }
820 break;
821
822 case 3: /* After [CR] LF . */
823 if (ch == '\n')
824 return END_DOT;
825 if (ch == '\r')
826 {
827 ch_state = 4;
828 continue;
829 }
830 ch_state = 1; /* The dot itself is removed */
831 break;
832
833 case 4: /* After [CR] LF . CR */
834 if (ch == '\n') return END_DOT;
835 message_size++;
836 body_linecount++;
837 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 838 (void) cutthrough_put_nl();
059ec3d9
PH
839 if (ch == '\r')
840 {
841 ch_state = 2;
842 continue;
843 }
844 ch_state = 1;
845 break;
846 }
847
848 /* Add the character to the spool file, unless skipping; then loop for the
849 next. */
850
851 message_size++;
1f5497b2 852 linelength++;
059ec3d9
PH
853 if (fout != NULL)
854 {
855 if (fputc(ch, fout) == EOF) return END_WERROR;
856 if (message_size > thismessage_size_limit) return END_SIZE;
857 }
e4bdf652
JH
858 if(ch == '\n')
859 (void) cutthrough_put_nl();
860 else
861 {
862 uschar c= ch;
863 (void) cutthrough_puts(&c, 1);
864 }
059ec3d9
PH
865 }
866
867/* Fall through here if EOF encountered. This indicates some kind of error,
868since a correct message is terminated by [CR] LF . [CR] LF. */
869
870return END_EOF;
871}
872
873
874
875
876/*************************************************
877* Swallow SMTP message *
878*************************************************/
879
880/* This function is called when there has been some kind of error while reading
881an SMTP message, and the remaining data may need to be swallowed. It is global
882because it is called from smtp_closedown() to shut down an incoming call
883tidily.
884
885Argument: a FILE from which to read the message
886Returns: nothing
887*/
888
889void
890receive_swallow_smtp(void)
891{
892if (message_ended >= END_NOTENDED)
893 message_ended = read_message_data_smtp(NULL);
894}
895
896
897
898/*************************************************
899* Handle lost SMTP connection *
900*************************************************/
901
902/* This function logs connection loss incidents and generates an appropriate
903SMTP response.
904
905Argument: additional data for the message
906Returns: the SMTP response
907*/
908
909static uschar *
910handle_lost_connection(uschar *s)
911{
912log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
913 "%s lost while reading message data%s", smtp_get_connection_info(), s);
914return US"421 Lost incoming connection";
915}
916
917
918
919
920/*************************************************
921* Handle a non-smtp reception error *
922*************************************************/
923
924/* This function is called for various errors during the reception of non-SMTP
925messages. It either sends a message to the sender of the problem message, or it
926writes to the standard error stream.
927
928Arguments:
929 errcode code for moan_to_sender(), identifying the error
930 text1 first message text, passed to moan_to_sender()
931 text2 second message text, used only for stderrr
932 error_rc code to pass to exim_exit if no problem
933 f FILE containing body of message (may be stdin)
934 hptr pointer to instore headers or NULL
935
936Returns: calls exim_exit(), which does not return
937*/
938
939static void
940give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
941 FILE *f, header_line *hptr)
942{
943if (error_handling == ERRORS_SENDER)
944 {
945 error_block eblock;
946 eblock.next = NULL;
947 eblock.text1 = text1;
948 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
949 error_rc = EXIT_FAILURE;
950 }
951else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 952(void)fclose(f);
059ec3d9
PH
953exim_exit(error_rc);
954}
955
956
957
958/*************************************************
959* Add header lines set up by ACL *
960*************************************************/
961
850635b6
PH
962/* This function is called to add the header lines that were set up by
963statements in an ACL to the list of headers in memory. It is done in two stages
964like this, because when the ACL for RCPT is running, the other headers have not
965yet been received. This function is called twice; once just before running the
966DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
967are visible to the DATA ACL.
059ec3d9
PH
968
969Originally these header lines were added at the end. Now there is support for
970three different places: top, bottom, and after the Received: header(s). There
971will always be at least one Received: header, even if it is marked deleted, and
972even if something else has been put in front of it.
973
974Arguments:
975 acl_name text to identify which ACL
976
977Returns: nothing
978*/
979
980static void
981add_acl_headers(uschar *acl_name)
982{
983header_line *h, *next;
984header_line *last_received = NULL;
e7568d51
TL
985
986if (acl_removed_headers != NULL)
987 {
988 DEBUG(D_receive|D_acl) debug_printf(">>Headers removed by %s ACL:\n", acl_name);
989
990 for (h = header_list; h != NULL; h = h->next)
991 {
e7568d51
TL
992 uschar *list;
993 BOOL include_header;
994
995 if (h->type == htype_old) continue;
996
997 include_header = TRUE;
998 list = acl_removed_headers;
999
1000 int sep = ':'; /* This is specified as a colon-separated list */
1001 uschar *s;
1002 uschar buffer[128];
1003 while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer)))
1004 != NULL)
1005 {
1006 int len = Ustrlen(s);
1007 if (header_testname(h, s, len, FALSE))
1008 {
1009 h->type = htype_old;
1010 DEBUG(D_receive|D_acl) debug_printf(" %s", h->text);
1011 }
1012 }
1013 }
1014 acl_removed_headers = NULL;
1015 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1016 }
059ec3d9 1017
71fafd95 1018if (acl_added_headers == NULL) return;
059ec3d9
PH
1019DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
1020
71fafd95 1021for (h = acl_added_headers; h != NULL; h = next)
059ec3d9
PH
1022 {
1023 next = h->next;
1024
1025 switch(h->type)
1026 {
1027 case htype_add_top:
1028 h->next = header_list;
1029 header_list = h;
1030 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
1031 break;
1032
1033 case htype_add_rec:
1034 if (last_received == NULL)
1035 {
1036 last_received = header_list;
1037 while (!header_testname(last_received, US"Received", 8, FALSE))
1038 last_received = last_received->next;
1039 while (last_received->next != NULL &&
1040 header_testname(last_received->next, US"Received", 8, FALSE))
1041 last_received = last_received->next;
1042 }
1043 h->next = last_received->next;
1044 last_received->next = h;
1045 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
1046 break;
1047
8523533c
TK
1048 case htype_add_rfc:
1049 /* add header before any header which is NOT Received: or Resent- */
1050 last_received = header_list;
1051 while ( (last_received->next != NULL) &&
1052 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
1053 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
1054 last_received = last_received->next;
1055 /* last_received now points to the last Received: or Resent-* header
1056 in an uninterrupted chain of those header types (seen from the beginning
1057 of all headers. Our current header must follow it. */
1058 h->next = last_received->next;
1059 last_received->next = h;
8e669ac1 1060 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
1061 break;
1062
059ec3d9
PH
1063 default:
1064 h->next = NULL;
1065 header_last->next = h;
1066 break;
1067 }
1068
1069 if (h->next == NULL) header_last = h;
1070
1071 /* Check for one of the known header types (From:, To:, etc.) though in
1072 practice most added headers are going to be "other". Lower case
1073 identification letters are never stored with the header; they are used
1074 for existence tests when messages are received. So discard any lower case
1075 flag values. */
1076
1077 h->type = header_checkname(h, FALSE);
1078 if (h->type >= 'a') h->type = htype_other;
1079
1080 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1081 }
1082
71fafd95 1083acl_added_headers = NULL;
059ec3d9
PH
1084DEBUG(D_receive|D_acl) debug_printf(">>\n");
1085}
1086
1087
1088
1089/*************************************************
1090* Add host information for log line *
1091*************************************************/
1092
1093/* Called for acceptance and rejecting log lines. This adds information about
1094the calling host to a string that is being built dynamically.
1095
1096Arguments:
1097 s the dynamic string
1098 sizeptr points to the size variable
1099 ptrptr points to the pointer variable
1100
1101Returns: the extended string
1102*/
1103
1104static uschar *
1105add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr)
1106{
1107if (sender_fullhost != NULL)
1108 {
1109 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
1110 if ((log_extra_selector & LX_incoming_interface) != 0 &&
1111 interface_address != NULL)
1112 {
1113 uschar *ss = string_sprintf(" I=[%s]:%d", interface_address,
1114 interface_port);
1115 s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss));
1116 }
1117 }
1118if (sender_ident != NULL)
1119 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1120if (received_protocol != NULL)
1121 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1122return s;
1123}
1124
1125
1126
63955bf2 1127#ifdef WITH_CONTENT_SCAN
059ec3d9
PH
1128
1129/*************************************************
54cdb463
PH
1130* Run the MIME ACL on a message *
1131*************************************************/
1132
1133/* This code is in a subroutine so that it can be used for both SMTP
1134and non-SMTP messages. It is called with a non-NULL ACL pointer.
1135
1136Arguments:
1137 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1138 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1139 smtp_reply_ptr Where SMTP reply is being built
1140 blackholed_by_ptr Where "blackholed by" message is being built
1141
1142Returns: TRUE to carry on; FALSE to abandon the message
1143*/
1144
1145static BOOL
1146run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1147 uschar **blackholed_by_ptr)
1148{
1149FILE *mbox_file;
1150uschar rfc822_file_path[2048];
1151unsigned long mbox_size;
1152header_line *my_headerlist;
1153uschar *user_msg, *log_msg;
1154int mime_part_count_buffer = -1;
7156b1ef 1155int rc = OK;
54cdb463
PH
1156
1157memset(CS rfc822_file_path,0,2048);
1158
1159/* check if it is a MIME message */
1160my_headerlist = header_list;
4e88a19f
PH
1161while (my_headerlist != NULL)
1162 {
54cdb463 1163 /* skip deleted headers */
4e88a19f
PH
1164 if (my_headerlist->type == '*')
1165 {
54cdb463
PH
1166 my_headerlist = my_headerlist->next;
1167 continue;
4e88a19f
PH
1168 }
1169 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1170 {
54cdb463
PH
1171 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1172 goto DO_MIME_ACL;
4e88a19f 1173 }
54cdb463 1174 my_headerlist = my_headerlist->next;
4e88a19f 1175 }
54cdb463
PH
1176
1177DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1178return TRUE;
1179
1180DO_MIME_ACL:
1181/* make sure the eml mbox file is spooled up */
8544e77a 1182mbox_file = spool_mbox(&mbox_size, NULL);
54cdb463
PH
1183if (mbox_file == NULL) {
1184 /* error while spooling */
1185 log_write(0, LOG_MAIN|LOG_PANIC,
1186 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1187 Uunlink(spool_name);
1188 unspool_mbox();
6f0c431a
PP
1189#ifdef EXPERIMENTAL_DCC
1190 dcc_ok = 0;
1191#endif
a5bd321b 1192 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
54cdb463
PH
1193 message_id[0] = 0; /* Indicate no message accepted */
1194 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1195 return FALSE; /* Indicate skip to end of receive function */
1196};
1197
1198mime_is_rfc822 = 0;
1199
1200MIME_ACL_CHECK:
1201mime_part_count = -1;
1202rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1203(void)fclose(mbox_file);
54cdb463 1204
4e88a19f
PH
1205if (Ustrlen(rfc822_file_path) > 0)
1206 {
54cdb463
PH
1207 mime_part_count = mime_part_count_buffer;
1208
4e88a19f
PH
1209 if (unlink(CS rfc822_file_path) == -1)
1210 {
54cdb463
PH
1211 log_write(0, LOG_PANIC,
1212 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1213 goto END_MIME_ACL;
4e88a19f
PH
1214 }
1215 }
54cdb463
PH
1216
1217/* check if we must check any message/rfc822 attachments */
4e88a19f
PH
1218if (rc == OK)
1219 {
54cdb463
PH
1220 uschar temp_path[1024];
1221 int n;
1222 struct dirent *entry;
1223 DIR *tempdir;
1224
b07e6aa3
PH
1225 (void)string_format(temp_path, 1024, "%s/scan/%s", spool_directory,
1226 message_id);
54cdb463 1227
4e88a19f
PH
1228 tempdir = opendir(CS temp_path);
1229 n = 0;
1230 do
1231 {
1232 entry = readdir(tempdir);
1233 if (entry == NULL) break;
1234 if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0)
1235 {
b07e6aa3 1236 (void)string_format(rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
4e88a19f
PH
1237 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path);
1238 break;
1239 }
1240 } while (1);
1241 closedir(tempdir);
54cdb463 1242
4e88a19f
PH
1243 if (entry != NULL)
1244 {
c58b88df 1245 mbox_file = Ufopen(rfc822_file_path,"rb");
4e88a19f
PH
1246 if (mbox_file == NULL)
1247 {
54cdb463
PH
1248 log_write(0, LOG_PANIC,
1249 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1250 unlink(CS rfc822_file_path);
1251 goto END_MIME_ACL;
4e88a19f 1252 }
54cdb463
PH
1253 /* set RFC822 expansion variable */
1254 mime_is_rfc822 = 1;
1255 mime_part_count_buffer = mime_part_count;
1256 goto MIME_ACL_CHECK;
4e88a19f
PH
1257 }
1258 }
54cdb463
PH
1259
1260END_MIME_ACL:
1261add_acl_headers(US"MIME");
1262if (rc == DISCARD)
1263 {
1264 recipients_count = 0;
1265 *blackholed_by_ptr = US"MIME ACL";
1266 }
1267else if (rc != OK)
1268 {
1269 Uunlink(spool_name);
1270 unspool_mbox();
6f0c431a
PP
1271#ifdef EXPERIMENTAL_DCC
1272 dcc_ok = 0;
1273#endif
54cdb463
PH
1274 if (smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1275 *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */
1276 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1277 message_id[0] = 0; /* Indicate no message accepted */
1278 return FALSE; /* Cause skip to end of receive function */
4e88a19f 1279 }
54cdb463
PH
1280
1281return TRUE;
1282}
1283
63955bf2 1284#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1285
1286
e4bdf652
JH
1287
1288void
1289received_header_gen(void)
1290{
1291uschar *received;
1292uschar *timestamp;
1293header_line *received_header= header_list;
1294
1295timestamp = expand_string(US"${tod_full}");
1296if (recipients_count == 1) received_for = recipients_list[0].address;
1297received = expand_string(received_header_text);
1298received_for = NULL;
1299
1300if (received == NULL)
1301 {
1302 if(spool_name[0] != 0)
1303 Uunlink(spool_name); /* Lose the data file */
1304 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1305 "(received_header_text) failed: %s", string_printing(received_header_text),
1306 expand_string_message);
1307 }
1308
1309/* The first element on the header chain is reserved for the Received header,
1310so all we have to do is fill in the text pointer, and set the type. However, if
1311the result of the expansion is an empty string, we leave the header marked as
1312"old" so as to refrain from adding a Received header. */
1313
1314if (received[0] == 0)
1315 {
1316 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1317 received_header->type = htype_old;
1318 }
1319else
1320 {
1321 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1322 received_header->type = htype_received;
1323 }
1324
1325received_header->slen = Ustrlen(received_header->text);
1326
1327DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1328 received_header->type, received_header->text);
1329}
1330
1331
1332
54cdb463 1333/*************************************************
059ec3d9
PH
1334* Receive message *
1335*************************************************/
1336
1337/* Receive a message on the given input, and put it into a pair of spool files.
1338Either a non-null list of recipients, or the extract flag will be true, or
1339both. The flag sender_local is true for locally generated messages. The flag
1340submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a 1341suppress_local_fixups is true if an ACL has obeyed "control =
f4ee74ac
PP
1342suppress_local_fixups" or -G was passed on the command-line.
1343The flag smtp_input is true if the message is to be
8800895a
PH
1344handled using SMTP conventions about termination and lines starting with dots.
1345For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1346
1347If a message was successfully read, message_id[0] will be non-zero.
1348
1349The general actions of this function are:
1350
1351 . Read the headers of the message (if any) into a chain of store
1352 blocks.
1353
1354 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1355 throw it away, unless the caller is trusted, or unless
1356 active_local_sender_retain is set - which can only happen if
1357 active_local_from_check is false.
059ec3d9
PH
1358
1359 . If recipients are to be extracted from the message, build the
1360 recipients list from the headers, removing any that were on the
1361 original recipients list (unless extract_addresses_remove_arguments is
1362 false), and at the same time, remove any bcc header that may be present.
1363
1364 . Get the spool file for the data, sort out its unique name, open
1365 and lock it (but don't give it the name yet).
1366
1367 . Generate a "Message-Id" header if the message doesn't have one, for
1368 locally-originated messages.
1369
1370 . Generate a "Received" header.
1371
1372 . Ensure the recipients list is fully qualified and rewritten if necessary.
1373
1374 . If there are any rewriting rules, apply them to the sender address
1375 and also to the headers.
1376
1377 . If there is no from: header, generate one, for locally-generated messages
1378 and messages in "submission mode" only.
1379
1380 . If the sender is local, check that from: is correct, and if not, generate
1381 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1382 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1383
1384 . If there is no "date" header, generate one, for locally-originated
1385 or submission mode messages only.
1386
1387 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1388 dot_ends mode, to the data file. Leave it open, to hold the lock.
1389
1390 . Write the envelope and the headers to a new file.
1391
1392 . Set the name for the header file; close it.
1393
1394 . Set the name for the data file; close it.
1395
1396Because this function can potentially be called many times in a single
1397SMTP connection, all store should be got by store_get(), so that it will be
1398automatically retrieved after the message is accepted.
1399
1400FUDGE: It seems that sites on the net send out messages with just LF
1401terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1402we make the CRs optional in all cases.
1403
1404July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1405new regime is now in place in which bare CRs in header lines are turned into LF
1406followed by a space, so as not to terminate the header line.
1407
1408February 2004: A bare LF in a header line in a message whose first line was
1409terminated by CRLF is treated in the same way as a bare CR.
1410
1411Arguments:
1412 extract_recip TRUE if recipients are to be extracted from the message's
1413 headers
1414
1415Returns: TRUE there are more messages to be read (SMTP input)
1416 FALSE there are no more messages to be read (non-SMTP input
1417 or SMTP connection collapsed, or other failure)
1418
1419When reading a message for filter testing, the returned value indicates
1420whether the headers (which is all that is read) were terminated by '.' or
1421not. */
1422
1423BOOL
1424receive_msg(BOOL extract_recip)
1425{
7156b1ef
NM
1426int i;
1427int rc = FAIL;
059ec3d9
PH
1428int msg_size = 0;
1429int process_info_len = Ustrlen(process_info);
1430int error_rc = (error_handling == ERRORS_SENDER)?
1431 errors_sender_rc : EXIT_FAILURE;
1432int header_size = 256;
1433int start, end, domain, size, sptr;
1434int id_resolution;
1435int had_zero = 0;
d677b2f2 1436int prevlines_length = 0;
059ec3d9
PH
1437
1438register int ptr = 0;
1439
1440BOOL contains_resent_headers = FALSE;
1441BOOL extracted_ignored = FALSE;
1442BOOL first_line_ended_crlf = TRUE_UNSET;
1443BOOL smtp_yield = TRUE;
1444BOOL yield = FALSE;
1445
1446BOOL resents_exist = FALSE;
1447uschar *resent_prefix = US"";
1448uschar *blackholed_by = NULL;
04f7d5b9 1449uschar *blackhole_log_msg = US"";
4ea50c5f 1450int cutthrough_done = 0;
059ec3d9
PH
1451
1452flock_t lock_data;
1453error_block *bad_addresses = NULL;
1454
1455uschar *frozen_by = NULL;
1456uschar *queued_by = NULL;
1457
1458uschar *errmsg, *s;
1459struct stat statbuf;
1460
4e88a19f 1461/* Final message to give to SMTP caller, and messages from ACLs */
059ec3d9
PH
1462
1463uschar *smtp_reply = NULL;
4e88a19f 1464uschar *user_msg, *log_msg;
059ec3d9
PH
1465
1466/* Working header pointers */
1467
1468header_line *h, *next;
1469
2cbb4081 1470/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1471
1472BOOL date_header_exists = FALSE;
1473
1474/* Pointers to receive the addresses of headers whose contents we need. */
1475
1476header_line *from_header = NULL;
1477header_line *subject_header = NULL;
1478header_line *msgid_header = NULL;
1479header_line *received_header;
1480
1481/* Variables for use when building the Received: header. */
1482
059ec3d9
PH
1483uschar *timestamp;
1484int tslen;
1485
1486/* Release any open files that might have been cached while preparing to
1487accept the message - e.g. by verifying addresses - because reading a message
1488might take a fair bit of real time. */
1489
1490search_tidyup();
1491
e4bdf652
JH
1492/* Extracting the recipient list from an input file is incompatible with
1493cutthrough delivery with the no-spool option. It shouldn't be possible
817d9f57 1494to set up the combination, but just in case kill any ongoing connection. */
e4bdf652 1495if (extract_recip || !smtp_input)
2e5b33cd 1496 cancel_cutthrough_connection("not smtp input");
e4bdf652 1497
059ec3d9
PH
1498/* Initialize the chain of headers by setting up a place-holder for Received:
1499header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1500pointing to the end of the chain to make adding headers simple. */
1501
1502received_header = header_list = header_last = store_get(sizeof(header_line));
1503header_list->next = NULL;
1504header_list->type = htype_old;
1505header_list->text = NULL;
1506header_list->slen = 0;
1507
1508/* Control block for the next header to be read. */
1509
1510next = store_get(sizeof(header_line));
1511next->text = store_get(header_size);
1512
1513/* Initialize message id to be null (indicating no message read), and the
1514header names list to be the normal list. Indicate there is no data file open
1515yet, initialize the size and warning count, and deal with no size limit. */
1516
1517message_id[0] = 0;
1518data_file = NULL;
1519data_fd = -1;
1520spool_name[0] = 0;
1521message_size = 0;
1522warning_count = 0;
d677b2f2 1523received_count = 1; /* For the one we will add */
059ec3d9
PH
1524
1525if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1526
2e0c1448 1527/* While reading the message, the following counts are computed. */
059ec3d9 1528
d677b2f2
PH
1529message_linecount = body_linecount = body_zerocount =
1530 max_received_linelength = 0;
059ec3d9 1531
80a47a2c
TK
1532#ifndef DISABLE_DKIM
1533/* Call into DKIM to set up the context. */
1534if (smtp_input && !smtp_batched_input && !dkim_disable_verify) dkim_exim_verify_init();
fb2274d4
TK
1535#endif
1536
059ec3d9
PH
1537/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1538ids, and fractions of a second are required. See the comments that precede the
1539message id creation below. */
1540
1541(void)gettimeofday(&message_id_tv, NULL);
1542
1543/* For other uses of the received time we can operate with granularity of one
1544second, and for that we use the global variable received_time. This is for
1545things like ultimate message timeouts. */
1546
1547received_time = message_id_tv.tv_sec;
1548
1549/* If SMTP input, set the special handler for timeouts. The alarm() calls
1550happen in the smtp_getc() function when it refills its buffer. */
1551
1552if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1553
1554/* If not SMTP input, timeout happens only if configured, and we just set a
1555single timeout for the whole message. */
1556
1557else if (receive_timeout > 0)
1558 {
1559 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1560 alarm(receive_timeout);
1561 }
1562
1563/* SIGTERM and SIGINT are caught always. */
1564
1565signal(SIGTERM, data_sigterm_sigint_handler);
1566signal(SIGINT, data_sigterm_sigint_handler);
1567
1568/* Header lines in messages are not supposed to be very long, though when
1569unfolded, to: and cc: headers can take up a lot of store. We must also cope
1570with the possibility of junk being thrown at us. Start by getting 256 bytes for
1571storing the header, and extend this as necessary using string_cat().
1572
1573To cope with total lunacies, impose an upper limit on the length of the header
1574section of the message, as otherwise the store will fill up. We must also cope
1575with the possibility of binary zeros in the data. Hence we cannot use fgets().
1576Folded header lines are joined into one string, leaving the '\n' characters
1577inside them, so that writing them out reproduces the input.
1578
1579Loop for each character of each header; the next structure for chaining the
1580header is set up already, with ptr the offset of the next character in
1581next->text. */
1582
1583for (;;)
1584 {
80a47a2c 1585 int ch = (receive_getc)();
059ec3d9
PH
1586
1587 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1588 SMTP must have a correct "." terminator. */
1589
1590 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1591 {
1592 smtp_reply = handle_lost_connection(US" (header)");
1593 smtp_yield = FALSE;
1594 goto TIDYUP; /* Skip to end of function */
1595 }
1596
1597 /* See if we are at the current header's size limit - there must be at least
1598 four bytes left. This allows for the new character plus a zero, plus two for
1599 extra insertions when we are playing games with dots and carriage returns. If
1600 we are at the limit, extend the text buffer. This could have been done
1601 automatically using string_cat() but because this is a tightish loop storing
1602 only one character at a time, we choose to do it inline. Normally
1603 store_extend() will be able to extend the block; only at the end of a big
1604 store block will a copy be needed. To handle the case of very long headers
1605 (and sometimes lunatic messages can have ones that are 100s of K long) we
1606 call store_release() for strings that have been copied - if the string is at
1607 the start of a block (and therefore the only thing in it, because we aren't
1608 doing any other gets), the block gets freed. We can only do this because we
1609 know there are no other calls to store_get() going on. */
1610
1611 if (ptr >= header_size - 4)
1612 {
1613 int oldsize = header_size;
1614 /* header_size += 256; */
1615 header_size *= 2;
1616 if (!store_extend(next->text, oldsize, header_size))
1617 {
1618 uschar *newtext = store_get(header_size);
1619 memcpy(newtext, next->text, ptr);
1620 store_release(next->text);
1621 next->text = newtext;
1622 }
1623 }
1624
1625 /* Cope with receiving a binary zero. There is dispute about whether
1626 these should be allowed in RFC 822 messages. The middle view is that they
1627 should not be allowed in headers, at least. Exim takes this attitude at
1628 the moment. We can't just stomp on them here, because we don't know that
1629 this line is a header yet. Set a flag to cause scanning later. */
1630
1631 if (ch == 0) had_zero++;
1632
1633 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1634 those from data files use just LF. Treat LF in local SMTP input as a
1635 terminator too. Treat EOF as a line terminator always. */
1636
1637 if (ch == EOF) goto EOL;
1638
1639 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1640 other MTAs accept this. We are therefore forced into this "liberalisation"
1641 too, so we accept LF as a line terminator whatever the source of the message.
1642 However, if the first line of the message ended with a CRLF, we treat a bare
1643 LF specially by inserting a white space after it to ensure that the header
1644 line is not terminated. */
1645
1646 if (ch == '\n')
1647 {
1648 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
80a47a2c 1649 else if (first_line_ended_crlf) receive_ungetc(' ');
059ec3d9
PH
1650 goto EOL;
1651 }
1652
1653 /* This is not the end of the line. If this is SMTP input and this is
1654 the first character in the line and it is a "." character, ignore it.
1655 This implements the dot-doubling rule, though header lines starting with
1656 dots aren't exactly common. They are legal in RFC 822, though. If the
1657 following is CRLF or LF, this is the line that that terminates the
1658 entire message. We set message_ended to indicate this has happened (to
1659 prevent further reading), and break out of the loop, having freed the
1660 empty header, and set next = NULL to indicate no data line. */
1661
1662 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1663 {
80a47a2c 1664 ch = (receive_getc)();
059ec3d9
PH
1665 if (ch == '\r')
1666 {
80a47a2c 1667 ch = (receive_getc)();
059ec3d9
PH
1668 if (ch != '\n')
1669 {
80a47a2c 1670 receive_ungetc(ch);
059ec3d9
PH
1671 ch = '\r'; /* Revert to CR */
1672 }
1673 }
1674 if (ch == '\n')
1675 {
1676 message_ended = END_DOT;
1677 store_reset(next);
1678 next = NULL;
1679 break; /* End character-reading loop */
1680 }
1681
1682 /* For non-SMTP input, the dot at the start of the line was really a data
1683 character. What is now in ch is the following character. We guaranteed
1684 enough space for this above. */
1685
1686 if (!smtp_input)
1687 {
1688 next->text[ptr++] = '.';
1689 message_size++;
1690 }
1691 }
1692
1693 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1694 remember this case if this is the first line ending. */
1695
1696 if (ch == '\r')
1697 {
80a47a2c 1698 ch = (receive_getc)();
059ec3d9
PH
1699 if (ch == '\n')
1700 {
1701 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1702 goto EOL;
1703 }
1704
1705 /* Otherwise, put back the character after CR, and turn the bare CR
1706 into LF SP. */
1707
80a47a2c 1708 ch = (receive_ungetc)(ch);
059ec3d9
PH
1709 next->text[ptr++] = '\n';
1710 message_size++;
1711 ch = ' ';
1712 }
1713
1714 /* We have a data character for the header line. */
1715
1716 next->text[ptr++] = ch; /* Add to buffer */
1717 message_size++; /* Total message size so far */
1718
1719 /* Handle failure due to a humungously long header section. The >= allows
1720 for the terminating \n. Add what we have so far onto the headers list so
1721 that it gets reflected in any error message, and back up the just-read
1722 character. */
1723
1724 if (message_size >= header_maxsize)
1725 {
1726 next->text[ptr] = 0;
1727 next->slen = ptr;
1728 next->type = htype_other;
1729 next->next = NULL;
1730 header_last->next = next;
1731 header_last = next;
1732
1733 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1734 "%s (more than %d characters): message abandoned",
1735 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1736
1737 if (smtp_input)
1738 {
1739 smtp_reply = US"552 Message header is ridiculously long";
1740 receive_swallow_smtp();
1741 goto TIDYUP; /* Skip to end of function */
1742 }
1743
1744 else
1745 {
1746 give_local_error(ERRMESS_VLONGHEADER,
1747 string_sprintf("message header longer than %d characters received: "
1748 "message not accepted", header_maxsize), US"", error_rc, stdin,
1749 header_list->next);
1750 /* Does not return */
1751 }
1752 }
1753
1754 continue; /* With next input character */
1755
1756 /* End of header line reached */
1757
1758 EOL:
2e0c1448
PH
1759
1760 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1761
1762 receive_linecount++;
1763 message_linecount++;
059ec3d9 1764
d677b2f2
PH
1765 /* Keep track of maximum line length */
1766
1767 if (ptr - prevlines_length > max_received_linelength)
1768 max_received_linelength = ptr - prevlines_length;
1769 prevlines_length = ptr + 1;
1770
059ec3d9
PH
1771 /* Now put in the terminating newline. There is always space for
1772 at least two more characters. */
1773
1774 next->text[ptr++] = '\n';
1775 message_size++;
1776
1777 /* A blank line signals the end of the headers; release the unwanted
1778 space and set next to NULL to indicate this. */
1779
1780 if (ptr == 1)
1781 {
1782 store_reset(next);
1783 next = NULL;
1784 break;
1785 }
1786
1787 /* There is data in the line; see if the next input character is a
1788 whitespace character. If it is, we have a continuation of this header line.
1789 There is always space for at least one character at this point. */
1790
1791 if (ch != EOF)
1792 {
80a47a2c 1793 int nextch = (receive_getc)();
059ec3d9
PH
1794 if (nextch == ' ' || nextch == '\t')
1795 {
1796 next->text[ptr++] = nextch;
1797 message_size++;
1798 continue; /* Iterate the loop */
1799 }
80a47a2c 1800 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
059ec3d9
PH
1801 else ch = EOF; /* Cause main loop to exit at end */
1802 }
1803
1804 /* We have got to the real line end. Terminate the string and release store
1805 beyond it. If it turns out to be a real header, internal binary zeros will
1806 be squashed later. */
1807
1808 next->text[ptr] = 0;
1809 next->slen = ptr;
1810 store_reset(next->text + ptr + 1);
1811
1812 /* Check the running total size against the overall message size limit. We
1813 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1814 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1815 headers - the code to read the body will then also hit the buffer. */
1816
1817 if (message_size > thismessage_size_limit) break;
1818
1819 /* A line that is not syntactically correct for a header also marks
1820 the end of the headers. In this case, we leave next containing the
1821 first data line. This might actually be several lines because of the
1822 continuation logic applied above, but that doesn't matter.
1823
1824 It turns out that smail, and presumably sendmail, accept leading lines
1825 of the form
1826
1827 From ph10 Fri Jan 5 12:35 GMT 1996
1828
1829 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1830 find any documentation of this, but for compatibility it had better be
1831 accepted. Exim restricts it to the case of non-smtp messages, and
1832 treats it as an alternative to the -f command line option. Thus it is
1833 ignored except for trusted users or filter testing. Otherwise it is taken
1834 as the sender address, unless -f was used (sendmail compatibility).
1835
1836 It further turns out that some UUCPs generate the From_line in a different
1837 format, e.g.
1838
1839 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1840
1841 The regex for matching these things is now capable of recognizing both
1842 formats (including 2- and 4-digit years in the latter). In fact, the regex
1843 is now configurable, as is the expansion string to fish out the sender.
1844
1845 Even further on it has been discovered that some broken clients send
1846 these lines in SMTP messages. There is now an option to ignore them from
1847 specified hosts or networks. Sigh. */
1848
1849 if (header_last == header_list &&
1850 (!smtp_input
1851 ||
1852 (sender_host_address != NULL &&
1853 verify_check_host(&ignore_fromline_hosts) == OK)
1854 ||
1855 (sender_host_address == NULL && ignore_fromline_local)
1856 ) &&
1857 regex_match_and_setup(regex_From, next->text, 0, -1))
1858 {
1859 if (!sender_address_forced)
1860 {
1861 uschar *uucp_sender = expand_string(uucp_from_sender);
1862 if (uucp_sender == NULL)
1863 {
1864 log_write(0, LOG_MAIN|LOG_PANIC,
1865 "expansion of \"%s\" failed after matching "
1866 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1867 }
1868 else
1869 {
1870 int start, end, domain;
1871 uschar *errmess;
1872 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1873 &start, &end, &domain, TRUE);
1874 if (newsender != NULL)
1875 {
1876 if (domain == 0 && newsender[0] != 0)
1877 newsender = rewrite_address_qualify(newsender, FALSE);
1878
f05da2e8 1879 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1880 {
1881 sender_address = newsender;
1882
f05da2e8 1883 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1884 {
1885 authenticated_sender = NULL;
1886 originator_name = US"";
1887 sender_local = FALSE;
1888 }
1889
f05da2e8 1890 if (filter_test != FTEST_NONE)
059ec3d9
PH
1891 printf("Sender taken from \"From \" line\n");
1892 }
1893 }
1894 }
1895 }
1896 }
1897
1898 /* Not a leading "From " line. Check to see if it is a valid header line.
1899 Header names may contain any non-control characters except space and colon,
1900 amazingly. */
1901
1902 else
1903 {
1904 uschar *p = next->text;
1905
1906 /* If not a valid header line, break from the header reading loop, leaving
1907 next != NULL, indicating that it holds the first line of the body. */
1908
1909 if (isspace(*p)) break;
1910 while (mac_isgraph(*p) && *p != ':') p++;
1911 while (isspace(*p)) p++;
1912 if (*p != ':')
1913 {
1914 body_zerocount = had_zero;
1915 break;
1916 }
1917
1918 /* We have a valid header line. If there were any binary zeroes in
1919 the line, stomp on them here. */
1920
1921 if (had_zero > 0)
1922 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
1923
1924 /* It is perfectly legal to have an empty continuation line
1925 at the end of a header, but it is confusing to humans
1926 looking at such messages, since it looks like a blank line.
1927 Reduce confusion by removing redundant white space at the
1928 end. We know that there is at least one printing character
1929 (the ':' tested for above) so there is no danger of running
1930 off the end. */
1931
1932 p = next->text + ptr - 2;
1933 for (;;)
1934 {
1935 while (*p == ' ' || *p == '\t') p--;
1936 if (*p != '\n') break;
1937 ptr = (p--) - next->text + 1;
1938 message_size -= next->slen - ptr;
1939 next->text[ptr] = 0;
1940 next->slen = ptr;
1941 }
1942
1943 /* Add the header to the chain */
1944
1945 next->type = htype_other;
1946 next->next = NULL;
1947 header_last->next = next;
1948 header_last = next;
1949
1950 /* Check the limit for individual line lengths. This comes after adding to
1951 the chain so that the failing line is reflected if a bounce is generated
1952 (for a local message). */
1953
1954 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
1955 {
1956 log_write(0, LOG_MAIN, "overlong message header line received from "
1957 "%s (more than %d characters): message abandoned",
1958 sender_host_unknown? sender_ident : sender_fullhost,
1959 header_line_maxsize);
1960
1961 if (smtp_input)
1962 {
1963 smtp_reply = US"552 A message header line is too long";
1964 receive_swallow_smtp();
1965 goto TIDYUP; /* Skip to end of function */
1966 }
1967
1968 else
1969 {
1970 give_local_error(ERRMESS_VLONGHDRLINE,
1971 string_sprintf("message header line longer than %d characters "
1972 "received: message not accepted", header_line_maxsize), US"",
1973 error_rc, stdin, header_list->next);
1974 /* Does not return */
1975 }
1976 }
1977
1978 /* Note if any resent- fields exist. */
1979
1980 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
1981 {
1982 resents_exist = TRUE;
1983 resent_prefix = US"Resent-";
1984 }
1985 }
1986
1987 /* The line has been handled. If we have hit EOF, break out of the loop,
1988 indicating no pending data line. */
1989
1990 if (ch == EOF) { next = NULL; break; }
1991
1992 /* Set up for the next header */
1993
1994 header_size = 256;
1995 next = store_get(sizeof(header_line));
1996 next->text = store_get(header_size);
1997 ptr = 0;
1998 had_zero = 0;
d677b2f2 1999 prevlines_length = 0;
059ec3d9
PH
2000 } /* Continue, starting to read the next header */
2001
2002/* At this point, we have read all the headers into a data structure in main
2003store. The first header is still the dummy placeholder for the Received: header
2004we are going to generate a bit later on. If next != NULL, it contains the first
2005data line - which terminated the headers before reaching a blank line (not the
2006normal case). */
2007
2008DEBUG(D_receive)
2009 {
2010 debug_printf(">>Headers received:\n");
2011 for (h = header_list->next; h != NULL; h = h->next)
2012 debug_printf("%s", h->text);
2013 debug_printf("\n");
2014 }
2015
2016/* End of file on any SMTP connection is an error. If an incoming SMTP call
2017is dropped immediately after valid headers, the next thing we will see is EOF.
2018We must test for this specially, as further down the reading of the data is
2019skipped if already at EOF. */
2020
2021if (smtp_input && (receive_feof)())
2022 {
2023 smtp_reply = handle_lost_connection(US" (after header)");
2024 smtp_yield = FALSE;
2025 goto TIDYUP; /* Skip to end of function */
2026 }
2027
2028/* If this is a filter test run and no headers were read, output a warning
2029in case there is a mistake in the test message. */
2030
f05da2e8 2031if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
2032 printf("Warning: no message headers read\n");
2033
2034
2035/* Scan the headers to identify them. Some are merely marked for later
2036processing; some are dealt with here. */
2037
2038for (h = header_list->next; h != NULL; h = h->next)
2039 {
2040 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
2041 if (is_resent) contains_resent_headers = TRUE;
2042
2043 switch (header_checkname(h, is_resent))
2044 {
059ec3d9 2045 case htype_bcc:
2cbb4081 2046 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
2047 break;
2048
059ec3d9 2049 case htype_cc:
2cbb4081 2050 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
2051 break;
2052
2053 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
2054
2055 case htype_date:
4c69d561 2056 if (!resents_exist || is_resent) date_header_exists = TRUE;
059ec3d9
PH
2057 break;
2058
2059 /* Same comments as about Return-Path: below. */
2060
2061 case htype_delivery_date:
2062 if (delivery_date_remove) h->type = htype_old;
2063 break;
2064
2065 /* Same comments as about Return-Path: below. */
2066
2067 case htype_envelope_to:
2068 if (envelope_to_remove) h->type = htype_old;
2069 break;
2070
2071 /* Mark all "From:" headers so they get rewritten. Save the one that is to
2072 be used for Sender: checking. For Sendmail compatibility, if the "From:"
2073 header consists of just the login id of the user who called Exim, rewrite
2074 it with the gecos field first. Apply this rule to Resent-From: if there
2075 are resent- fields. */
2076
2077 case htype_from:
2078 h->type = htype_from;
2079 if (!resents_exist || is_resent)
2080 {
2081 from_header = h;
2082 if (!smtp_input)
2083 {
5de8faa3 2084 int len;
059ec3d9
PH
2085 uschar *s = Ustrchr(h->text, ':') + 1;
2086 while (isspace(*s)) s++;
5de8faa3 2087 len = h->slen - (s - h->text) - 1;
e0fccd1d
TF
2088 if (Ustrlen(originator_login) == len &&
2089 strncmpic(s, originator_login, len) == 0)
059ec3d9
PH
2090 {
2091 uschar *name = is_resent? US"Resent-From" : US"From";
2092 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2093 originator_login, qualify_domain_sender);
2094 from_header = header_last;
2095 h->type = htype_old;
2096 DEBUG(D_receive|D_rewrite)
2097 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2098 }
2099 }
2100 }
2101 break;
2102
2103 /* Identify the Message-id: header for generating "in-reply-to" in the
2104 autoreply transport. For incoming logging, save any resent- value. In both
2105 cases, take just the first of any multiples. */
2106
2107 case htype_id:
2108 if (msgid_header == NULL && (!resents_exist || is_resent))
2109 {
2110 msgid_header = h;
2111 h->type = htype_id;
2112 }
2113 break;
2114
2115 /* Flag all Received: headers */
2116
2117 case htype_received:
2118 h->type = htype_received;
2119 received_count++;
2120 break;
2121
2122 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2123
2124 case htype_reply_to:
2125 h->type = htype_reply_to;
2126 break;
2127
2128 /* The Return-path: header is supposed to be added to messages when
2129 they leave the SMTP system. We shouldn't receive messages that already
2130 contain Return-path. However, since Exim generates Return-path: on
2131 local delivery, resent messages may well contain it. We therefore
2132 provide an option (which defaults on) to remove any Return-path: headers
2133 on input. Removal actually means flagging as "old", which prevents the
2134 header being transmitted with the message. */
2135
2136 case htype_return_path:
2137 if (return_path_remove) h->type = htype_old;
2138
2139 /* If we are testing a mail filter file, use the value of the
2140 Return-Path: header to set up the return_path variable, which is not
2141 otherwise set. However, remove any <> that surround the address
2142 because the variable doesn't have these. */
2143
f05da2e8 2144 if (filter_test != FTEST_NONE)
059ec3d9
PH
2145 {
2146 uschar *start = h->text + 12;
2147 uschar *end = start + Ustrlen(start);
2148 while (isspace(*start)) start++;
2149 while (end > start && isspace(end[-1])) end--;
2150 if (*start == '<' && end[-1] == '>')
2151 {
2152 start++;
2153 end--;
2154 }
2155 return_path = string_copyn(start, end - start);
2156 printf("Return-path taken from \"Return-path:\" header line\n");
2157 }
2158 break;
2159
2160 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
2161 and from an untrusted caller and suppress_local_fixups is not set, or if we
2162 are in submission mode for a remote message, mark it "old" so that it will
2163 not be transmitted with the message, unless active_local_sender_retain is
2164 set. (This can only be true if active_local_from_check is false.) If there
2165 are any resent- headers in the message, apply this rule to Resent-Sender:
2166 instead of Sender:. Messages with multiple resent- header sets cannot be
2167 tidily handled. (For this reason, at least one MUA - Pine - turns old
2168 resent- headers into X-resent- headers when resending, leaving just one
2169 set.) */
059ec3d9
PH
2170
2171 case htype_sender:
69358f02 2172 h->type = ((!active_local_sender_retain &&
8800895a
PH
2173 (
2174 (sender_local && !trusted_caller && !suppress_local_fixups)
2175 || submission_mode
2176 )
059ec3d9
PH
2177 ) &&
2178 (!resents_exist||is_resent))?
2179 htype_old : htype_sender;
2180 break;
2181
2182 /* Remember the Subject: header for logging. There is no Resent-Subject */
2183
2184 case htype_subject:
2185 subject_header = h;
2186 break;
2187
2188 /* "To:" gets flagged, and the existence of a recipient header is noted,
2189 whether it's resent- or not. */
2190
2191 case htype_to:
2192 h->type = htype_to;
2193 /****
2194 to_or_cc_header_exists = TRUE;
2195 ****/
2196 break;
2197 }
2198 }
2199
2200/* Extract recipients from the headers if that is required (the -t option).
2201Note that this is documented as being done *before* any address rewriting takes
2202place. There are two possibilities:
2203
2204(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2205recipients already listed are to be REMOVED from the message. Smail 3 works
2206like this. We need to build a non-recipients tree for that list, because in
2207subsequent processing this data is held in a tree and that's what the
2208spool_write_header() function expects. Make sure that non-recipient addresses
2209are fully qualified and rewritten if necessary.
2210
2211(2) According to other sendmail documentation, -t ADDS extracted recipients to
2212those in the command line arguments (and it is rumoured some other MTAs do
2213this). Therefore, there is an option to make Exim behave this way.
2214
2215*** Notes on "Resent-" header lines ***
2216
2217The presence of resent-headers in the message makes -t horribly ambiguous.
2218Experiments with sendmail showed that it uses recipients for all resent-
2219headers, totally ignoring the concept of "sets of resent- headers" as described
2220in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2221with all the addresses in one instance of each header.
2222
2223This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2224error for -t if there were resent- headers in the message. However, after a
2225discussion on the mailing list, I've learned that there are MUAs that use
2226resent- headers with -t, and also that the stuff about sets of resent- headers
2227and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2228message with -t and resent- header lines makes sure that only *its* resent-
2229headers are present; previous ones are often renamed as X-resent- for example.
2230
2231Consequently, Exim has been changed so that, if any resent- header lines are
2232present, the recipients are taken from all of the appropriate resent- lines,
2233and not from the ordinary To:, Cc:, etc. */
2234
2235if (extract_recip)
2236 {
2237 int rcount = 0;
2238 error_block **bnext = &bad_addresses;
2239
2240 if (extract_addresses_remove_arguments)
2241 {
2242 while (recipients_count-- > 0)
2243 {
2244 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2245 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2246 tree_add_nonrecipient(s);
2247 }
2248 recipients_list = NULL;
2249 recipients_count = recipients_list_max = 0;
2250 }
2251
059ec3d9
PH
2252 /* Now scan the headers */
2253
2254 for (h = header_list->next; h != NULL; h = h->next)
2255 {
2256 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2257 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2258 {
2259 uschar *s = Ustrchr(h->text, ':') + 1;
2260 while (isspace(*s)) s++;
2261
1eccaa59
PH
2262 parse_allow_group = TRUE; /* Allow address group syntax */
2263
059ec3d9
PH
2264 while (*s != 0)
2265 {
2266 uschar *ss = parse_find_address_end(s, FALSE);
2267 uschar *recipient, *errmess, *p, *pp;
2268 int start, end, domain;
2269
2270 /* Check on maximum */
2271
2272 if (recipients_max > 0 && ++rcount > recipients_max)
2273 {
2274 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2275 US"message rejected: ", error_rc, stdin, NULL);
2276 /* Does not return */
2277 }
2278
2279 /* Make a copy of the address, and remove any internal newlines. These
2280 may be present as a result of continuations of the header line. The
2281 white space that follows the newline must not be removed - it is part
2282 of the header. */
2283
2284 pp = recipient = store_get(ss - s + 1);
2285 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2286 *pp = 0;
2287 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2288 &domain, FALSE);
2289
2290 /* Keep a list of all the bad addresses so we can send a single
2291 error message at the end. However, an empty address is not an error;
2292 just ignore it. This can come from an empty group list like
2293
2294 To: Recipients of list:;
2295
2296 If there are no recipients at all, an error will occur later. */
2297
2298 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2299 {
2300 int len = Ustrlen(s);
2301 error_block *b = store_get(sizeof(error_block));
2302 while (len > 0 && isspace(s[len-1])) len--;
2303 b->next = NULL;
2304 b->text1 = string_printing(string_copyn(s, len));
2305 b->text2 = errmess;
2306 *bnext = b;
2307 bnext = &(b->next);
2308 }
2309
2310 /* If the recipient is already in the nonrecipients tree, it must
2311 have appeared on the command line with the option extract_addresses_
2312 remove_arguments set. Do not add it to the recipients, and keep a note
2313 that this has happened, in order to give a better error if there are
2314 no recipients left. */
2315
2316 else if (recipient != NULL)
2317 {
2318 if (tree_search(tree_nonrecipients, recipient) == NULL)
2319 receive_add_recipient(recipient, -1);
2320 else
2321 extracted_ignored = TRUE;
2322 }
2323
2324 /* Move on past this address */
2325
2326 s = ss + (*ss? 1:0);
2327 while (isspace(*s)) s++;
1eccaa59
PH
2328 } /* Next address */
2329
2330 parse_allow_group = FALSE; /* Reset group syntax flags */
2331 parse_found_group = FALSE;
059ec3d9
PH
2332
2333 /* If this was the bcc: header, mark it "old", which means it
2334 will be kept on the spool, but not transmitted as part of the
2335 message. */
2336
2cbb4081 2337 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2338 } /* For appropriate header line */
2339 } /* For each header line */
2340
059ec3d9
PH
2341 }
2342
2343/* Now build the unique message id. This has changed several times over the
2344lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2345Retaining all the history in the comment has become too unwieldy - read
2346previous release sources if you want it.
2347
2348The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2349The first part is the current time, in seconds. The second part is the current
2350pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2351can hold a number in the range 0-3843. It used to be a computed sequence
2352number, but is now the fractional component of the current time in units of
23531/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2354received, Exim ensures that the timer has ticked at the appropriate level
2355before proceeding, to avoid duplication if the pid happened to be re-used
2356within the same time period. It seems likely that most messages will take at
2357least half a millisecond to be received, so no delay will normally be
2358necessary. At least for some time...
2359
2360There is a modification when localhost_number is set. Formerly this was allowed
2361to be as large as 255. Now it is restricted to the range 0-16, and the final
2362component of the message id becomes (localhost_number * 200) + fractional time
2363in units of 1/200 of a second (i.e. a value in the range 0-3399).
2364
2365Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2366Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2367still allows the tttttt field to hold a large enough number to last for some
2368more decades, and the final two-digit field can hold numbers up to 1295, which
2369is enough for milliseconds (instead of 1/2000 of a second).
2370
2371However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2372pid, so it is probably safe because pids have to be positive. The
2373localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2374final field becomes (localhost_number * 100) + fractional time in centiseconds.
2375
2376Note that string_base62() returns its data in a static storage block, so it
2377must be copied before calling string_base62() again. It always returns exactly
23786 characters.
2379
2380There doesn't seem to be anything in the RFC which requires a message id to
2381start with a letter, but Smail was changed to ensure this. The external form of
2382the message id (as supplied by string expansion) therefore starts with an
2383additional leading 'E'. The spool file names do not include this leading
2384letter and it is not used internally.
2385
2386NOTE: If ever the format of message ids is changed, the regular expression for
2387checking that a string is in this format must be updated in a corresponding
2388way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2389must also be changed to reflect the correct string length. Then, of course,
2390other programs that rely on the message id format will need updating too. */
2391
2392Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2393message_id[6] = '-';
2394Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2395
2396/* Deal with the case where the host number is set. The value of the number was
2397checked when it was read, to ensure it isn't too big. The timing granularity is
2398left in id_resolution so that an appropriate wait can be done after receiving
2399the message, if necessary (we hope it won't be). */
2400
2401if (host_number_string != NULL)
2402 {
2403 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2404 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2405 string_base62((long int)(
2406 host_number * (1000000/id_resolution) +
2407 message_id_tv.tv_usec/id_resolution)) + 4);
2408 }
2409
2410/* Host number not set: final field is just the fractional time at an
2411appropriate resolution. */
2412
2413else
2414 {
2415 id_resolution = (BASE_62 == 62)? 500 : 1000;
2416 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2417 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2418 }
2419
2420/* Add the current message id onto the current process info string if
2421it will fit. */
2422
2423(void)string_format(process_info + process_info_len,
2424 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2425
2426/* If we are using multiple input directories, set up the one for this message
2427to be the least significant base-62 digit of the time of arrival. Otherwise
2428ensure that it is an empty string. */
2429
2430message_subdir[0] = split_spool_directory? message_id[5] : 0;
2431
2432/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2433one, but only for local (without suppress_local_fixups) or submission mode
2434messages. This can be user-configured if required, but we had better flatten
2435any illegal characters therein. */
059ec3d9 2436
8800895a
PH
2437if (msgid_header == NULL &&
2438 ((sender_host_address == NULL && !suppress_local_fixups)
2439 || submission_mode))
059ec3d9
PH
2440 {
2441 uschar *p;
2442 uschar *id_text = US"";
2443 uschar *id_domain = primary_hostname;
2444
2445 /* Permit only letters, digits, dots, and hyphens in the domain */
2446
2447 if (message_id_domain != NULL)
2448 {
2449 uschar *new_id_domain = expand_string(message_id_domain);
2450 if (new_id_domain == NULL)
2451 {
2452 if (!expand_string_forcedfail)
2453 log_write(0, LOG_MAIN|LOG_PANIC,
2454 "expansion of \"%s\" (message_id_header_domain) "
2455 "failed: %s", message_id_domain, expand_string_message);
2456 }
2457 else if (*new_id_domain != 0)
2458 {
2459 id_domain = new_id_domain;
2460 for (p = id_domain; *p != 0; p++)
2461 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2462 }
2463 }
2464
2465 /* Permit all characters except controls and RFC 2822 specials in the
2466 additional text part. */
2467
2468 if (message_id_text != NULL)
2469 {
2470 uschar *new_id_text = expand_string(message_id_text);
2471 if (new_id_text == NULL)
2472 {
2473 if (!expand_string_forcedfail)
2474 log_write(0, LOG_MAIN|LOG_PANIC,
2475 "expansion of \"%s\" (message_id_header_text) "
2476 "failed: %s", message_id_text, expand_string_message);
2477 }
2478 else if (*new_id_text != 0)
2479 {
2480 id_text = new_id_text;
2481 for (p = id_text; *p != 0; p++)
2482 if (mac_iscntrl_or_special(*p)) *p = '-';
2483 }
2484 }
2485
e7e680d6
PP
2486 /* Add the header line
2487 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2488 * appended, to preserve classical expectations of header ordering. */
059ec3d9 2489
e7e680d6 2490 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
5eb690a1
NM
2491 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2492 (*id_text == 0)? "" : ".", id_text, id_domain);
059ec3d9
PH
2493 }
2494
2495/* If we are to log recipients, keep a copy of the raw ones before any possible
2496rewriting. Must copy the count, because later ACLs and the local_scan()
2497function may mess with the real recipients. */
2498
2499if ((log_extra_selector & LX_received_recipients) != 0)
2500 {
2501 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2502 for (i = 0; i < recipients_count; i++)
2503 raw_recipients[i] = string_copy(recipients_list[i].address);
2504 raw_recipients_count = recipients_count;
2505 }
2506
2507/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2508recipients will get here only if the conditions were right (allow_unqualified_
2509recipient is TRUE). */
2510
2511for (i = 0; i < recipients_count; i++)
2512 recipients_list[i].address =
2513 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2514 global_rewrite_rules, rewrite_existflags);
2515
8800895a
PH
2516/* If there is no From: header, generate one for local (without
2517suppress_local_fixups) or submission_mode messages. If there is no sender
2518address, but the sender is local or this is a local delivery error, use the
2519originator login. This shouldn't happen for genuine bounces, but might happen
2520for autoreplies. The addition of From: must be done *before* checking for the
2521possible addition of a Sender: header, because untrusted_set_sender allows an
2522untrusted user to set anything in the envelope (which might then get info
2523From:) but we still want to ensure a valid Sender: if it is required. */
2524
2525if (from_header == NULL &&
2526 ((sender_host_address == NULL && !suppress_local_fixups)
2527 || submission_mode))
059ec3d9 2528 {
2fe1a124
PH
2529 uschar *oname = US"";
2530
2531 /* Use the originator_name if this is a locally submitted message and the
2532 caller is not trusted. For trusted callers, use it only if -F was used to
2533 force its value or if we have a non-SMTP message for which -f was not used
2534 to set the sender. */
2535
2536 if (sender_host_address == NULL)
2537 {
2538 if (!trusted_caller || sender_name_forced ||
2539 (!smtp_input && !sender_address_forced))
2540 oname = originator_name;
2541 }
2542
2543 /* For non-locally submitted messages, the only time we use the originator
2544 name is when it was forced by the /name= option on control=submission. */
2545
2546 else
2547 {
2548 if (submission_name != NULL) oname = submission_name;
2549 }
2550
059ec3d9
PH
2551 /* Envelope sender is empty */
2552
2553 if (sender_address[0] == 0)
2554 {
87ba3f5f
PH
2555 uschar *fromstart, *fromend;
2556
2557 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2558 oname, (oname[0] == 0)? "" : " <");
2559 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2560
059ec3d9
PH
2561 if (sender_local || local_error_message)
2562 {
87ba3f5f
PH
2563 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2564 local_part_quote(originator_login), qualify_domain_sender,
2565 fromend);
059ec3d9
PH
2566 }
2567 else if (submission_mode && authenticated_id != NULL)
2568 {
2569 if (submission_domain == NULL)
2570 {
87ba3f5f
PH
2571 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2572 local_part_quote(authenticated_id), qualify_domain_sender,
2573 fromend);
059ec3d9
PH
2574 }
2575 else if (submission_domain[0] == 0) /* empty => whole address set */
2576 {
87ba3f5f
PH
2577 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2578 fromend);
059ec3d9
PH
2579 }
2580 else
2581 {
87ba3f5f
PH
2582 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2583 local_part_quote(authenticated_id), submission_domain,
2584 fromend);
059ec3d9
PH
2585 }
2586 from_header = header_last; /* To get it checked for Sender: */
2587 }
2588 }
2589
2590 /* There is a non-null envelope sender. Build the header using the original
2591 sender address, before any rewriting that might have been done while
2592 verifying it. */
2593
2594 else
2595 {
87ba3f5f 2596 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2597 oname,
2598 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2599 (sender_address_unrewritten == NULL)?
2600 sender_address : sender_address_unrewritten,
2fe1a124 2601 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2602
2603 from_header = header_last; /* To get it checked for Sender: */
2604 }
2605 }
2606
2607
8800895a
PH
2608/* If the sender is local (without suppress_local_fixups), or if we are in
2609submission mode and there is an authenticated_id, check that an existing From:
2610is correct, and if not, generate a Sender: header, unless disabled. Any
2611previously-existing Sender: header was removed above. Note that sender_local,
2612as well as being TRUE if the caller of exim is not trusted, is also true if a
2613trusted caller did not supply a -f argument for non-smtp input. To allow
2614trusted callers to forge From: without supplying -f, we have to test explicitly
2615here. If the From: header contains more than one address, then the call to
2616parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2617
2618if (from_header != NULL &&
69358f02 2619 (active_local_from_check &&
8800895a 2620 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2621 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2622 ))
2623 {
2624 BOOL make_sender = TRUE;
2625 int start, end, domain;
2626 uschar *errmess;
2627 uschar *from_address =
2628 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2629 &start, &end, &domain, FALSE);
2630 uschar *generated_sender_address;
2631
2632 if (submission_mode)
2633 {
2634 if (submission_domain == NULL)
2635 {
2636 generated_sender_address = string_sprintf("%s@%s",
2637 local_part_quote(authenticated_id), qualify_domain_sender);
2638 }
2639 else if (submission_domain[0] == 0) /* empty => full address */
2640 {
2641 generated_sender_address = string_sprintf("%s",
2642 authenticated_id);
2643 }
2644 else
2645 {
2646 generated_sender_address = string_sprintf("%s@%s",
2647 local_part_quote(authenticated_id), submission_domain);
2648 }
2649 }
2650 else
2651 generated_sender_address = string_sprintf("%s@%s",
2652 local_part_quote(originator_login), qualify_domain_sender);
2653
2654 /* Remove permitted prefixes and suffixes from the local part of the From:
2655 address before doing the comparison with the generated sender. */
2656
2657 if (from_address != NULL)
2658 {
2659 int slen;
2660 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2661
2662 if (at != NULL) *at = 0;
2663 from_address += route_check_prefix(from_address, local_from_prefix);
2664 slen = route_check_suffix(from_address, local_from_suffix);
2665 if (slen > 0)
2666 {
2667 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2668 from_address += slen;
2669 }
2670 if (at != NULL) *at = '@';
2671
2672 if (strcmpic(generated_sender_address, from_address) == 0 ||
2673 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2674 make_sender = FALSE;
2675 }
2676
2677 /* We have to cause the Sender header to be rewritten if there are
2678 appropriate rewriting rules. */
2679
2680 if (make_sender)
2681 {
2fe1a124 2682 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2683 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2684 generated_sender_address);
2685 else
2686 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2687 resent_prefix,
2688 submission_mode? submission_name : originator_name,
2689 generated_sender_address);
059ec3d9 2690 }
87ba3f5f
PH
2691
2692 /* Ensure that a non-null envelope sender address corresponds to the
2693 submission mode sender address. */
2694
2695 if (submission_mode && sender_address[0] != 0)
2696 {
2697 if (sender_address_unrewritten == NULL)
2698 sender_address_unrewritten = sender_address;
2699 sender_address = generated_sender_address;
089793a4
TF
2700 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2701 log_write(L_address_rewrite, LOG_MAIN,
2702 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2703 sender_address_unrewritten, generated_sender_address);
87ba3f5f 2704 }
059ec3d9
PH
2705 }
2706
2707
2708/* If there are any rewriting rules, apply them to the sender address, unless
2709it has already been rewritten as part of verification for SMTP input. */
2710
2711if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2712 sender_address[0] != 0)
2713 {
2714 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2715 global_rewrite_rules, rewrite_existflags);
2716 DEBUG(D_receive|D_rewrite)
2717 debug_printf("rewritten sender = %s\n", sender_address);
2718 }
2719
2720
2721/* The headers must be run through rewrite_header(), because it ensures that
2722addresses are fully qualified, as well as applying any rewriting rules that may
2723exist.
2724
2725Qualification of header addresses in a message from a remote host happens only
2726if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2727appropriate. For local messages, qualification always happens, unless -bnq is
2728used to explicitly suppress it. No rewriting is done for an unqualified address
2729that is left untouched.
2730
2731We start at the second header, skipping our own Received:. This rewriting is
2732documented as happening *after* recipient addresses are taken from the headers
2733by the -t command line option. An added Sender: gets rewritten here. */
2734
2735for (h = header_list->next; h != NULL; h = h->next)
2736 {
2737 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2738 rewrite_existflags, TRUE);
2739 if (newh != NULL) h = newh;
2740 }
2741
2742
2743/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2744"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2745"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2746exists, this applies to the set of resent- headers rather than the normal set.
2747
2cbb4081
PH
2748The requirement for a recipient header has been removed in RFC 2822. At this
2749point in the code, earlier versions of Exim added a To: header for locally
2750submitted messages, and an empty Bcc: header for others. In the light of the
2751changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2752
059ec3d9
PH
2753
2754/* If there is no date header, generate one if the message originates locally
8800895a
PH
2755(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2756submission mode flag is set. Messages without Date: are not valid, but it seems
e7e680d6
PP
2757to be more confusing if Exim adds one to all remotely-originated messages.
2758As per Message-Id, we prepend if resending, else append.
2759*/
059ec3d9 2760
8800895a
PH
2761if (!date_header_exists &&
2762 ((sender_host_address == NULL && !suppress_local_fixups)
2763 || submission_mode))
e7e680d6
PP
2764 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2765 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
059ec3d9
PH
2766
2767search_tidyup(); /* Free any cached resources */
2768
2769/* Show the complete set of headers if debugging. Note that the first one (the
2770new Received:) has not yet been set. */
2771
2772DEBUG(D_receive)
2773 {
2774 debug_printf(">>Headers after rewriting and local additions:\n");
2775 for (h = header_list->next; h != NULL; h = h->next)
2776 debug_printf("%c %s", h->type, h->text);
2777 debug_printf("\n");
2778 }
2779
2780/* The headers are now complete in store. If we are running in filter
2781testing mode, that is all this function does. Return TRUE if the message
2782ended with a dot. */
2783
f05da2e8 2784if (filter_test != FTEST_NONE)
059ec3d9
PH
2785 {
2786 process_info[process_info_len] = 0;
2787 return message_ended == END_DOT;
2788 }
2789
817d9f57 2790/* Cutthrough delivery:
e4bdf652
JH
2791 We have to create the Received header now rather than at the end of reception,
2792 so the timestamp behaviour is a change to the normal case.
2793 XXX Ensure this gets documented XXX.
817d9f57 2794 Having created it, send the headers to the destination.
e4bdf652
JH
2795*/
2796if (cutthrough_fd >= 0)
2797 {
817d9f57
JH
2798 if (received_count > received_headers_max)
2799 {
2e5b33cd 2800 cancel_cutthrough_connection("too many headers");
817d9f57
JH
2801 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2802 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2803 "Too many \"Received\" headers",
2804 sender_address,
2805 (sender_fullhost == NULL)? "" : " H=",
2806 (sender_fullhost == NULL)? US"" : sender_fullhost,
2807 (sender_ident == NULL)? "" : " U=",
2808 (sender_ident == NULL)? US"" : sender_ident);
2809 message_id[0] = 0; /* Indicate no message accepted */
2810 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2811 goto TIDYUP; /* Skip to end of function */
2812 }
e4bdf652
JH
2813 received_header_gen();
2814 add_acl_headers(US"MAIL or RCPT");
2815 (void) cutthrough_headers_send();
2816 }
817d9f57 2817
e4bdf652 2818
059ec3d9
PH
2819/* Open a new spool file for the data portion of the message. We need
2820to access it both via a file descriptor and a stream. Try to make the
2821directory if it isn't there. Note re use of sprintf: spool_directory
2822is checked on input to be < 200 characters long. */
2823
2824sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir,
2825 message_id);
2826data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2827if (data_fd < 0)
2828 {
2829 if (errno == ENOENT)
2830 {
2831 uschar temp[16];
2832 sprintf(CS temp, "input/%s", message_subdir);
2833 if (message_subdir[0] == 0) temp[5] = 0;
2834 (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE);
2835 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2836 }
2837 if (data_fd < 0)
2838 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2839 spool_name, strerror(errno));
2840 }
2841
2842/* Make sure the file's group is the Exim gid, and double-check the mode
2843because the group setting doesn't always get set automatically. */
2844
1ac6b2e7
JH
2845if (fchown(data_fd, exim_uid, exim_gid))
2846 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2847 "Failed setting ownership on spool file %s: %s",
2848 spool_name, strerror(errno));
ff790e47 2849(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2850
2851/* We now have data file open. Build a stream for it and lock it. We lock only
2852the first line of the file (containing the message ID) because otherwise there
2853are problems when Exim is run under Cygwin (I'm told). See comments in
2854spool_in.c, where the same locking is done. */
2855
2856data_file = fdopen(data_fd, "w+");
2857lock_data.l_type = F_WRLCK;
2858lock_data.l_whence = SEEK_SET;
2859lock_data.l_start = 0;
2860lock_data.l_len = SPOOL_DATA_START_OFFSET;
2861
2862if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2863 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2864 errno, strerror(errno));
2865
2866/* We have an open, locked data file. Write the message id to it to make it
2867self-identifying. Then read the remainder of the input of this message and
2868write it to the data file. If the variable next != NULL, it contains the first
2869data line (which was read as a header but then turned out not to have the right
2870format); write it (remembering that it might contain binary zeros). The result
2871of fwrite() isn't inspected; instead we call ferror() below. */
2872
2873fprintf(data_file, "%s-D\n", message_id);
2874if (next != NULL)
2875 {
2876 uschar *s = next->text;
2877 int len = next->slen;
1ac6b2e7 2878 len = fwrite(s, 1, len, data_file); len = len; /* compiler quietening */
059ec3d9
PH
2879 body_linecount++; /* Assumes only 1 line */
2880 }
2881
2882/* Note that we might already be at end of file, or the logical end of file
2883(indicated by '.'), or might have encountered an error while writing the
2884message id or "next" line. */
2885
2886if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
2887 {
2888 if (smtp_input)
2889 {
2890 message_ended = read_message_data_smtp(data_file);
2891 receive_linecount++; /* The terminating "." line */
2892 }
2893 else message_ended = read_message_data(data_file);
2894
2895 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 2896 message_linecount += body_linecount;
059ec3d9
PH
2897
2898 /* Handle premature termination of SMTP */
2899
2900 if (smtp_input && message_ended == END_EOF)
2901 {
2902 Uunlink(spool_name); /* Lose data file when closed */
2e5b33cd 2903 cancel_cutthrough_connection("sender closed connection");
059ec3d9
PH
2904 message_id[0] = 0; /* Indicate no message accepted */
2905 smtp_reply = handle_lost_connection(US"");
2906 smtp_yield = FALSE;
2907 goto TIDYUP; /* Skip to end of function */
2908 }
2909
2910 /* Handle message that is too big. Don't use host_or_ident() in the log
2911 message; we want to see the ident value even for non-remote messages. */
2912
2913 if (message_ended == END_SIZE)
2914 {
2915 Uunlink(spool_name); /* Lose the data file when closed */
2e5b33cd 2916 cancel_cutthrough_connection("mail too big");
059ec3d9
PH
2917 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2918
2919 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2920 "message too big: read=%d max=%d",
2921 sender_address,
2922 (sender_fullhost == NULL)? "" : " H=",
2923 (sender_fullhost == NULL)? US"" : sender_fullhost,
2924 (sender_ident == NULL)? "" : " U=",
2925 (sender_ident == NULL)? US"" : sender_ident,
2926 message_size,
2927 thismessage_size_limit);
2928
2929 if (smtp_input)
2930 {
2931 smtp_reply = US"552 Message size exceeds maximum permitted";
2932 message_id[0] = 0; /* Indicate no message accepted */
2933 goto TIDYUP; /* Skip to end of function */
2934 }
2935 else
2936 {
2937 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2938 give_local_error(ERRMESS_TOOBIG,
2939 string_sprintf("message too big (max=%d)", thismessage_size_limit),
2940 US"message rejected: ", error_rc, data_file, header_list);
2941 /* Does not return */
2942 }
2943 }
2944 }
2945
2946/* Restore the standard SIGALRM handler for any subsequent processing. (For
2947example, there may be some expansion in an ACL that uses a timer.) */
2948
2949os_non_restarting_signal(SIGALRM, sigalrm_handler);
2950
2951/* The message body has now been read into the data file. Call fflush() to
2952empty the buffers in C, and then call fsync() to get the data written out onto
2953the disk, as fflush() doesn't do this (or at least, it isn't documented as
2954having to do this). If there was an I/O error on either input or output,
2955attempt to send an error message, and unlink the spool file. For non-SMTP input
2956we can then give up. Note that for SMTP input we must swallow the remainder of
2957the input in cases of output errors, since the far end doesn't expect to see
2958anything until the terminating dot line is sent. */
2959
2960if (fflush(data_file) == EOF || ferror(data_file) ||
54fc8428 2961 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
059ec3d9
PH
2962 {
2963 uschar *msg_errno = US strerror(errno);
2964 BOOL input_error = (receive_ferror)() != 0;
2965 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
2966 input_error? "Input read" : "Spool write",
2967 msg_errno,
2968 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
2969
2970 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
2971 Uunlink(spool_name); /* Lose the data file */
2e5b33cd 2972 cancel_cutthrough_connection("error writing spoolfile");
059ec3d9
PH
2973
2974 if (smtp_input)
2975 {
2976 if (input_error)
2977 smtp_reply = US"451 Error while reading input data";
2978 else
2979 {
2980 smtp_reply = US"451 Error while writing spool file";
2981 receive_swallow_smtp();
2982 }
2983 message_id[0] = 0; /* Indicate no message accepted */
2984 goto TIDYUP; /* Skip to end of function */
2985 }
2986
2987 else
2988 {
2989 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
2990 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
2991 header_list);
2992 /* Does not return */
2993 }
2994 }
2995
2996
2997/* No I/O errors were encountered while writing the data file. */
2998
2999DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
3000
3001
3002/* If there were any bad addresses extracted by -t, or there were no recipients
3003left after -t, send a message to the sender of this message, or write it to
3004stderr if the error handling option is set that way. Note that there may
3005legitimately be no recipients for an SMTP message if they have all been removed
3006by "discard".
3007
3008We need to rewind the data file in order to read it. In the case of no
3009recipients or stderr error writing, throw the data file away afterwards, and
3010exit. (This can't be SMTP, which always ensures there's at least one
3011syntactically good recipient address.) */
3012
3013if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
3014 {
3015 DEBUG(D_receive)
3016 {
3017 if (recipients_count == 0) debug_printf("*** No recipients\n");
3018 if (bad_addresses != NULL)
3019 {
3020 error_block *eblock = bad_addresses;
3021 debug_printf("*** Bad address(es)\n");
3022 while (eblock != NULL)
3023 {
3024 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
3025 eblock = eblock->next;
3026 }
3027 }
3028 }
3029
3030 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3031
3032 /* If configured to send errors to the sender, but this fails, force
3033 a failure error code. We use a special one for no recipients so that it
3034 can be detected by the autoreply transport. Otherwise error_rc is set to
3035 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
3036 it is EXIT_SUCCESS. */
3037
3038 if (error_handling == ERRORS_SENDER)
3039 {
3040 if (!moan_to_sender(
3041 (bad_addresses == NULL)?
3042 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
3043 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
3044 bad_addresses, header_list, data_file, FALSE))
3045 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
3046 }
3047 else
3048 {
3049 if (bad_addresses == NULL)
3050 {
3051 if (extracted_ignored)
3052 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
3053 else
3054 fprintf(stderr, "exim: no recipients in message\n");
3055 }
3056 else
3057 {
3058 fprintf(stderr, "exim: invalid address%s",
3059 (bad_addresses->next == NULL)? ":" : "es:\n");
3060 while (bad_addresses != NULL)
3061 {
3062 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
3063 bad_addresses->text2);
3064 bad_addresses = bad_addresses->next;
3065 }
3066 }
3067 }
3068
3069 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
3070 {
3071 Uunlink(spool_name);
f1e894f3 3072 (void)fclose(data_file);
059ec3d9
PH
3073 exim_exit(error_rc);
3074 }
3075 }
3076
3077/* Data file successfully written. Generate text for the Received: header by
3078expanding the configured string, and adding a timestamp. By leaving this
3079operation till now, we ensure that the timestamp is the time that message
3080reception was completed. However, this is deliberately done before calling the
3081data ACL and local_scan().
3082
3083This Received: header may therefore be inspected by the data ACL and by code in
3084the local_scan() function. When they have run, we update the timestamp to be
3085the final time of reception.
3086
3087If there is just one recipient, set up its value in the $received_for variable
3088for use when we generate the Received: header.
3089
3090Note: the checking for too many Received: headers is handled by the delivery
3091code. */
e4bdf652 3092/*XXX eventually add excess Received: check for cutthrough case back when classifying them */
059ec3d9 3093
e4bdf652 3094if (received_header->text == NULL) /* Non-cutthrough case */
059ec3d9 3095 {
e4bdf652 3096 received_header_gen();
059ec3d9 3097
e4bdf652 3098 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
059ec3d9 3099
e4bdf652
JH
3100 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3101 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9 3102
e4bdf652
JH
3103 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3104 now, before running the DATA ACL. */
059ec3d9 3105
e4bdf652
JH
3106 add_acl_headers(US"MAIL or RCPT");
3107 }
817d9f57 3108else
e4bdf652
JH
3109 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3110 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9
PH
3111
3112/* If an ACL is specified for checking things at this stage of reception of a
3113message, run it, unless all the recipients were removed by "discard" in earlier
3114ACLs. That is the only case in which recipients_count can be zero at this
3115stage. Set deliver_datafile to point to the data file so that $message_body and
3116$message_body_end can be extracted if needed. Allow $recipients in expansions.
3117*/
3118
3119deliver_datafile = data_fd;
4e88a19f 3120user_msg = NULL;
059ec3d9 3121
0e20aff9
MH
3122enable_dollar_recipients = TRUE;
3123
059ec3d9
PH
3124if (recipients_count == 0)
3125 {
3126 blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL";
3127 }
3128else
3129 {
059ec3d9
PH
3130 /* Handle interactive SMTP messages */
3131
3132 if (smtp_input && !smtp_batched_input)
3133 {
8523533c 3134
80a47a2c
TK
3135#ifndef DISABLE_DKIM
3136 if (!dkim_disable_verify)
3137 {
3138 /* Finish verification, this will log individual signature results to
3139 the mainlog */
3140 dkim_exim_verify_finish();
3141
3142 /* Check if we must run the DKIM ACL */
3143 if ((acl_smtp_dkim != NULL) &&
3144 (dkim_verify_signers != NULL) &&
3145 (dkim_verify_signers[0] != '\0'))
3146 {
3147 uschar *dkim_verify_signers_expanded =
3148 expand_string(dkim_verify_signers);
3149 if (dkim_verify_signers_expanded == NULL)
3150 {
3151 log_write(0, LOG_MAIN|LOG_PANIC,
3152 "expansion of dkim_verify_signers option failed: %s",
3153 expand_string_message);
3154 }
3155 else
3156 {
3157 int sep = 0;
3158 uschar *ptr = dkim_verify_signers_expanded;
3159 uschar *item = NULL;
9e5d6b55
TK
3160 uschar *seen_items = NULL;
3161 int seen_items_size = 0;
3162 int seen_items_offset = 0;
80a47a2c 3163 uschar itembuf[256];
9122af94
TK
3164 /* Default to OK when no items are present */
3165 rc = OK;
80a47a2c
TK
3166 while ((item = string_nextinlist(&ptr, &sep,
3167 itembuf,
3168 sizeof(itembuf))) != NULL)
3169 {
6119d1ea
TK
3170 /* Prevent running ACL for an empty item */
3171 if (!item || (item[0] == '\0')) continue;
9e5d6b55
TK
3172 /* Only run ACL once for each domain or identity, no matter how often it
3173 appears in the expanded list. */
6119d1ea
TK
3174 if (seen_items != NULL)
3175 {
ae9094bf
TK
3176 uschar *seen_item = NULL;
3177 uschar seen_item_buf[256];
4a73449b 3178 uschar *seen_items_list = seen_items;
ae9094bf
TK
3179 int seen_this_item = 0;
3180
3181 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
3182 seen_item_buf,
3183 sizeof(seen_item_buf))) != NULL)
3184 {
3185 if (Ustrcmp(seen_item,item) == 0)
3186 {
3187 seen_this_item = 1;
3188 break;
3189 }
3190 }
3191
3192 if (seen_this_item > 0)
6119d1ea
TK
3193 {
3194 DEBUG(D_receive)
3195 debug_printf("acl_smtp_dkim: skipping signer %s, already seen\n", item);
3196 continue;
3197 }
ae9094bf 3198
4a73449b 3199 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,":");
6119d1ea
TK
3200 }
3201
4a73449b
TK
3202 seen_items = string_append(seen_items,&seen_items_size,&seen_items_offset,1,item);
3203 seen_items[seen_items_offset] = '\0';
6119d1ea
TK
3204
3205 DEBUG(D_receive)
3206 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n", item);
3207
80a47a2c
TK
3208 dkim_exim_acl_setup(item);
3209 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim, &user_msg, &log_msg);
6119d1ea
TK
3210
3211 if (rc != OK)
3212 {
3213 DEBUG(D_receive)
3214 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, skipping remaining items\n", rc, item);
2e5b33cd 3215 cancel_cutthrough_connection("dkim acl not ok");
6119d1ea
TK
3216 break;
3217 }
80a47a2c
TK
3218 }
3219 add_acl_headers(US"DKIM");
3220 if (rc == DISCARD)
3221 {
3222 recipients_count = 0;
3223 blackholed_by = US"DKIM ACL";
3224 if (log_msg != NULL)
3225 blackhole_log_msg = string_sprintf(": %s", log_msg);
3226 }
3227 else if (rc != OK)
3228 {
3229 Uunlink(spool_name);
3230 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
3231 smtp_yield = FALSE; /* No more messsages after dropped connection */
3232 smtp_reply = US""; /* Indicate reply already sent */
3233 message_id[0] = 0; /* Indicate no message accepted */
3234 goto TIDYUP; /* Skip to end of function */
3235 }
3236 }
3237 }
3238 }
3239#endif /* DISABLE_DKIM */
fb2274d4 3240
8523533c 3241#ifdef WITH_CONTENT_SCAN
80a47a2c
TK
3242 if (recipients_count > 0 &&
3243 acl_smtp_mime != NULL &&
54cdb463
PH
3244 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3245 goto TIDYUP;
8523533c
TK
3246#endif /* WITH_CONTENT_SCAN */
3247
fd98a5c6
JH
3248#ifdef EXPERIMENTAL_PRDR
3249 if (prdr_requested && recipients_count > 1 && acl_smtp_data_prdr != NULL )
3250 {
3251 unsigned int c;
3252 int all_pass = OK;
3253 int all_fail = FAIL;
3254
3255 smtp_printf("353 PRDR content analysis beginning\r\n");
3256 /* Loop through recipients, responses must be in same order received */
3257 for (c = 0; recipients_count > c; c++)
3258 {
3259 uschar * addr= recipients_list[c].address;
3260 uschar * msg= US"PRDR R=<%s> %s";
3261 uschar * code;
3262 DEBUG(D_receive)
3263 debug_printf("PRDR processing recipient %s (%d of %d)\n",
3264 addr, c+1, recipients_count);
3265 rc = acl_check(ACL_WHERE_PRDR, addr,
3266 acl_smtp_data_prdr, &user_msg, &log_msg);
3267
3268 /* If any recipient rejected content, indicate it in final message */
3269 all_pass |= rc;
3270 /* If all recipients rejected, indicate in final message */
3271 all_fail &= rc;
3272
3273 switch (rc)
3274 {
3275 case OK: case DISCARD: code = US"250"; break;
3276 case DEFER: code = US"450"; break;
3277 default: code = US"550"; break;
3278 }
3279 if (user_msg != NULL)
3280 smtp_user_msg(code, user_msg);
3281 else
3282 {
3283 switch (rc)
3284 {
3285 case OK: case DISCARD:
3286 msg = string_sprintf(CS msg, addr, "acceptance"); break;
3287 case DEFER:
3288 msg = string_sprintf(CS msg, addr, "temporary refusal"); break;
3289 default:
3290 msg = string_sprintf(CS msg, addr, "refusal"); break;
3291 }
3292 smtp_user_msg(code, msg);
3293 }
3294 if (log_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, log_msg);
3295 else if (user_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, user_msg);
3296 else log_write(0, LOG_MAIN, CS msg);
3297
3298 if (rc != OK) { receive_remove_recipient(addr); c--; }
3299 }
3300 /* Set up final message, used if data acl gives OK */
3301 smtp_reply = string_sprintf("%s id=%s message %s",
3302 all_fail == FAIL ? US"550" : US"250",
3303 message_id,
3304 all_fail == FAIL
3305 ? US"rejected for all recipients"
3306 : all_pass == OK
3307 ? US"accepted"
3308 : US"accepted for some recipients");
3309 if (recipients_count == 0)
3310 {
3311 message_id[0] = 0; /* Indicate no message accepted */
3312 goto TIDYUP;
3313 }
3314 }
3315 else
3316 prdr_requested = FALSE;
3317#endif /* EXPERIMENTAL_PRDR */
3318
54cdb463
PH
3319 /* Check the recipients count again, as the MIME ACL might have changed
3320 them. */
8523533c 3321
059ec3d9
PH
3322 if (acl_smtp_data != NULL && recipients_count > 0)
3323 {
059ec3d9
PH
3324 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
3325 add_acl_headers(US"DATA");
3326 if (rc == DISCARD)
3327 {
3328 recipients_count = 0;
3329 blackholed_by = US"DATA ACL";
8e669ac1
PH
3330 if (log_msg != NULL)
3331 blackhole_log_msg = string_sprintf(": %s", log_msg);
2e5b33cd 3332 cancel_cutthrough_connection("data acl discard");
059ec3d9
PH
3333 }
3334 else if (rc != OK)
3335 {
3336 Uunlink(spool_name);
2e5b33cd 3337 cancel_cutthrough_connection("data acl not ok");
8523533c
TK
3338#ifdef WITH_CONTENT_SCAN
3339 unspool_mbox();
3340#endif
6f0c431a
PP
3341#ifdef EXPERIMENTAL_DCC
3342 dcc_ok = 0;
3343#endif
059ec3d9
PH
3344 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
3345 smtp_yield = FALSE; /* No more messsages after dropped connection */
3346 smtp_reply = US""; /* Indicate reply already sent */
3347 message_id[0] = 0; /* Indicate no message accepted */
3348 goto TIDYUP; /* Skip to end of function */
3349 }
3350 }
3351 }
3352
3353 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3354 we cannot take different actions for permanent and temporary rejections. */
3355
54cdb463 3356 else
059ec3d9 3357 {
54cdb463
PH
3358
3359#ifdef WITH_CONTENT_SCAN
3360 if (acl_not_smtp_mime != NULL &&
3361 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3362 &blackholed_by))
3363 goto TIDYUP;
3364#endif /* WITH_CONTENT_SCAN */
3365
3366 if (acl_not_smtp != NULL)
059ec3d9 3367 {
54cdb463
PH
3368 uschar *user_msg, *log_msg;
3369 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3370 if (rc == DISCARD)
059ec3d9 3371 {
54cdb463
PH
3372 recipients_count = 0;
3373 blackholed_by = US"non-SMTP ACL";
3374 if (log_msg != NULL)
3375 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 3376 }
54cdb463 3377 else if (rc != OK)
059ec3d9 3378 {
54cdb463
PH
3379 Uunlink(spool_name);
3380#ifdef WITH_CONTENT_SCAN
3381 unspool_mbox();
3382#endif
6f0c431a
PP
3383#ifdef EXPERIMENTAL_DCC
3384 dcc_ok = 0;
3385#endif
6ea85e9a
PH
3386 /* The ACL can specify where rejections are to be logged, possibly
3387 nowhere. The default is main and reject logs. */
3388
3389 if (log_reject_target != 0)
3390 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3391 sender_address, log_msg);
3392
54cdb463
PH
3393 if (user_msg == NULL) user_msg = US"local configuration problem";
3394 if (smtp_batched_input)
3395 {
3396 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3397 /* Does not return */
3398 }
3399 else
3400 {
3401 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3402 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3403 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3404 header_list);
3405 /* Does not return */
3406 }
059ec3d9 3407 }
54cdb463 3408 add_acl_headers(US"non-SMTP");
059ec3d9 3409 }
059ec3d9
PH
3410 }
3411
54cdb463
PH
3412 /* The applicable ACLs have been run */
3413
059ec3d9
PH
3414 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3415 if (queue_only_policy) queued_by = US"ACL";
059ec3d9
PH
3416 }
3417
8523533c
TK
3418#ifdef WITH_CONTENT_SCAN
3419unspool_mbox();
3420#endif
3421
6a8f9482
TK
3422#ifdef EXPERIMENTAL_DCC
3423dcc_ok = 0;
3424#endif
3425
3426
059ec3d9
PH
3427/* The final check on the message is to run the scan_local() function. The
3428version supplied with Exim always accepts, but this is a hook for sysadmins to
3429supply their own checking code. The local_scan() function is run even when all
3430the recipients have been discarded. */
3431
3432lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3433
3434/* Arrange to catch crashes in local_scan(), so that the -D file gets
3435deleted, and the incident gets logged. */
3436
3437os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3438os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3439os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3440os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3441
3442DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3443 local_scan_timeout);
3444local_scan_data = NULL;
3445
3446os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3447if (local_scan_timeout > 0) alarm(local_scan_timeout);
3448rc = local_scan(data_fd, &local_scan_data);
3449alarm(0);
3450os_non_restarting_signal(SIGALRM, sigalrm_handler);
3451
0e20aff9
MH
3452enable_dollar_recipients = FALSE;
3453
059ec3d9
PH
3454store_pool = POOL_MAIN; /* In case changed */
3455DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3456 local_scan_data);
3457
3458os_non_restarting_signal(SIGSEGV, SIG_DFL);
3459os_non_restarting_signal(SIGFPE, SIG_DFL);
3460os_non_restarting_signal(SIGILL, SIG_DFL);
3461os_non_restarting_signal(SIGBUS, SIG_DFL);
3462
3463/* The length check is paranoia against some runaway code, and also because
3464(for a success return) lines in the spool file are read into big_buffer. */
3465
3466if (local_scan_data != NULL)
3467 {
3468 int len = Ustrlen(local_scan_data);
3469 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3470 local_scan_data = string_copyn(local_scan_data, len);
3471 }
3472
3473if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3474 {
58eb016e 3475 if (!deliver_freeze) /* ACL might have already frozen */
059ec3d9
PH
3476 {
3477 deliver_freeze = TRUE;
3478 deliver_frozen_at = time(NULL);
3479 frozen_by = US"local_scan()";
3480 }
3481 rc = LOCAL_SCAN_ACCEPT;
3482 }
3483else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3484 {
3485 if (!queue_only_policy) /* ACL might have already queued */
3486 {
3487 queue_only_policy = TRUE;
3488 queued_by = US"local_scan()";
3489 }
3490 rc = LOCAL_SCAN_ACCEPT;
3491 }
3492
3493/* Message accepted: remove newlines in local_scan_data because otherwise
3494the spool file gets corrupted. Ensure that all recipients are qualified. */
3495
3496if (rc == LOCAL_SCAN_ACCEPT)
3497 {
3498 if (local_scan_data != NULL)
3499 {
3500 uschar *s;
3501 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3502 }
3503 for (i = 0; i < recipients_count; i++)
3504 {
3505 recipient_item *r = recipients_list + i;
3506 r->address = rewrite_address_qualify(r->address, TRUE);
3507 if (r->errors_to != NULL)
3508 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3509 }
3510 if (recipients_count == 0 && blackholed_by == NULL)
3511 blackholed_by = US"local_scan";
3512 }
3513
3514/* Message rejected: newlines permitted in local_scan_data to generate
3515multiline SMTP responses. */
3516
3517else
3518 {
3519 uschar *istemp = US"";
3520 uschar *s = NULL;
a5bd321b 3521 uschar *smtp_code;
059ec3d9
PH
3522 int size = 0;
3523 int sptr = 0;
059ec3d9
PH
3524
3525 errmsg = local_scan_data;
3526
3527 Uunlink(spool_name); /* Cancel this message */
3528 switch(rc)
3529 {
3530 default:
3531 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3532 "rejection given", rc);
3533 goto TEMPREJECT;
3534
3535 case LOCAL_SCAN_REJECT_NOLOGHDR:
3536 log_extra_selector &= ~LX_rejected_header;
3537 /* Fall through */
3538
3539 case LOCAL_SCAN_REJECT:
a5bd321b 3540 smtp_code = US"550";
059ec3d9
PH
3541 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3542 break;
3543
3544 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
3545 log_extra_selector &= ~LX_rejected_header;
3546 /* Fall through */
3547
3548 case LOCAL_SCAN_TEMPREJECT:
3549 TEMPREJECT:
a5bd321b 3550 smtp_code = US"451";
059ec3d9
PH
3551 if (errmsg == NULL) errmsg = US"Temporary local problem";
3552 istemp = US"temporarily ";
3553 break;
3554 }
3555
3556 s = string_append(s, &size, &sptr, 2, US"F=",
3557 (sender_address[0] == 0)? US"<>" : sender_address);
3558 s = add_host_info_for_log(s, &size, &sptr);
3559 s[sptr] = 0;
3560
3561 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3562 s, istemp, string_printing(errmsg));
3563
3564 if (smtp_input)
3565 {
3566 if (!smtp_batched_input)
3567 {
a5bd321b 3568 smtp_respond(smtp_code, 3, TRUE, errmsg);
059ec3d9
PH
3569 message_id[0] = 0; /* Indicate no message accepted */
3570 smtp_reply = US""; /* Indicate reply already sent */
3571 goto TIDYUP; /* Skip to end of function */
3572 }
3573 else
3574 {
a5bd321b 3575 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
059ec3d9
PH
3576 /* Does not return */
3577 }
3578 }
3579 else
3580 {
3581 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3582 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3583 US"message rejected by local scan code: ", error_rc, data_file,
3584 header_list);
3585 /* Does not return */
3586 }
3587 }
3588
3589/* Reset signal handlers to ignore signals that previously would have caused
3590the message to be abandoned. */
3591
3592signal(SIGTERM, SIG_IGN);
3593signal(SIGINT, SIG_IGN);
3594
e4bdf652 3595
059ec3d9
PH
3596/* Ensure the first time flag is set in the newly-received message. */
3597
3598deliver_firsttime = TRUE;
3599
8523533c
TK
3600#ifdef EXPERIMENTAL_BRIGHTMAIL
3601if (bmi_run == 1) {
3602 /* rewind data file */
3603 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3604 bmi_verdicts = bmi_process_message(header_list, data_fd);
3605};
3606#endif
3607
059ec3d9
PH
3608/* Update the timstamp in our Received: header to account for any time taken by
3609an ACL or by local_scan(). The new time is the time that all reception
3610processing is complete. */
3611
3612timestamp = expand_string(US"${tod_full}");
3613tslen = Ustrlen(timestamp);
3614
3615memcpy(received_header->text + received_header->slen - tslen - 1,
3616 timestamp, tslen);
3617
3618/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3619
3620if (mua_wrapper)
3621 {
3622 deliver_freeze = FALSE;
3623 queue_only_policy = FALSE;
3624 }
3625
3626/* Keep the data file open until we have written the header file, in order to
3627hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3628don't write the header file, and we unlink the data file. If writing the header
3629file fails, we have failed to accept this message. */
3630
3631if (host_checking || blackholed_by != NULL)
3632 {
3633 header_line *h;
3634 Uunlink(spool_name);
3635 msg_size = 0; /* Compute size for log line */
3636 for (h = header_list; h != NULL; h = h->next)
3637 if (h->type != '*') msg_size += h->slen;
3638 }
3639
3640/* Write the -H file */
3641
3642else
3643 {
3644 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3645 {
3646 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3647 Uunlink(spool_name); /* Lose the data file */
3648
3649 if (smtp_input)
3650 {
3651 smtp_reply = US"451 Error in writing spool file";
3652 message_id[0] = 0; /* Indicate no message accepted */
3653 goto TIDYUP;
3654 }
3655 else
3656 {
3657 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3658 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3659 header_list);
3660 /* Does not return */
3661 }
3662 }
3663 }
3664
3665
3666/* The message has now been successfully received. */
3667
3668receive_messagecount++;
3669
3670/* In SMTP sessions we may receive several in one connection. After each one,
3671we wait for the clock to tick at the level of message-id granularity. This is
3672so that the combination of time+pid is unique, even on systems where the pid
3673can be re-used within our time interval. We can't shorten the interval without
3674re-designing the message-id. See comments above where the message id is
3675created. This is Something For The Future. */
3676
3677message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3678exim_wait_tick(&message_id_tv, id_resolution);
3679
3680/* Add data size to written header size. We do not count the initial file name
3681that is in the file, but we do add one extra for the notional blank line that
3682precedes the data. This total differs from message_size in that it include the
3683added Received: header and any other headers that got created locally. */
3684
3685fflush(data_file);
3686fstat(data_fd, &statbuf);
3687
3688msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3689
3690/* Generate a "message received" log entry. We do this by building up a dynamic
3691string as required. Since we commonly want to add two items at a time, use a
3692macro to simplify the coding. We log the arrival of a new message while the
3693file is still locked, just in case the machine is *really* fast, and delivers
3694it first! Include any message id that is in the message - since the syntax of a
3695message id is actually an addr-spec, we can use the parse routine to canonicize
3696it. */
3697
3698size = 256;
3699sptr = 0;
3700s = store_get(size);
3701
3702s = string_append(s, &size, &sptr, 2, US"<= ",
3703 (sender_address[0] == 0)? US"<>" : sender_address);
3704if (message_reference != NULL)
3705 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3706
3707s = add_host_info_for_log(s, &size, &sptr);
3708
3709#ifdef SUPPORT_TLS
817d9f57
JH
3710if ((log_extra_selector & LX_tls_cipher) != 0 && tls_in.cipher != NULL)
3711 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
059ec3d9 3712if ((log_extra_selector & LX_tls_certificate_verified) != 0 &&
817d9f57 3713 tls_in.cipher != NULL)
059ec3d9 3714 s = string_append(s, &size, &sptr, 2, US" CV=",
817d9f57
JH
3715 tls_in.certificate_verified? "yes":"no");
3716if ((log_extra_selector & LX_tls_peerdn) != 0 && tls_in.peerdn != NULL)
48ed62d9 3717 s = string_append(s, &size, &sptr, 3, US" DN=\"",
817d9f57
JH
3718 string_printing(tls_in.peerdn), US"\"");
3719if ((log_extra_selector & LX_tls_sni) != 0 && tls_in.sni != NULL)
3f0945ff 3720 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
817d9f57 3721 string_printing(tls_in.sni), US"\"");
3f0945ff 3722#endif
059ec3d9
PH
3723
3724if (sender_host_authenticated != NULL)
3725 {
3726 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
3727 if (authenticated_id != NULL)
c8e2fc1e 3728 {
059ec3d9 3729 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
c8e2fc1e
JH
3730 if (log_extra_selector & LX_smtp_mailauth && authenticated_sender != NULL)
3731 s = string_append(s, &size, &sptr, 2, US":", authenticated_sender);
3732 }
059ec3d9
PH
3733 }
3734
fd98a5c6
JH
3735#ifdef EXPERIMENTAL_PRDR
3736if (prdr_requested)
3737 s = string_append(s, &size, &sptr, 1, US" PRDR");
3738#endif
3739
059ec3d9
PH
3740sprintf(CS big_buffer, "%d", msg_size);
3741s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3742
3c0a92dc
JH
3743/* log 8BITMIME mode announced in MAIL_FROM
3744 0 ... no BODY= used
3745 7 ... 7BIT
3746 8 ... 8BITMIME */
c8e2fc1e
JH
3747if (log_extra_selector & LX_8bitmime)
3748 {
3c0a92dc
JH
3749 sprintf(CS big_buffer, "%d", body_8bitmime);
3750 s = string_append(s, &size, &sptr, 2, US" M8S=", big_buffer);
c8e2fc1e 3751 }
3c0a92dc 3752
059ec3d9
PH
3753/* If an addr-spec in a message-id contains a quoted string, it can contain
3754any characters except " \ and CR and so in particular it can contain NL!
3755Therefore, make sure we use a printing-characters only version for the log.
3756Also, allow for domain literals in the message id. */
3757
3758if (msgid_header != NULL)
3759 {
3760 uschar *old_id;
3761 BOOL save_allow_domain_literals = allow_domain_literals;
3762 allow_domain_literals = TRUE;
3763 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3764 &errmsg, &start, &end, &domain, FALSE);
3765 allow_domain_literals = save_allow_domain_literals;
3766 if (old_id != NULL)
3767 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3768 }
3769
3770/* If subject logging is turned on, create suitable printing-character
3771text. By expanding $h_subject: we make use of the MIME decoding. */
3772
3773if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL)
3774 {
3775 int i;
3776 uschar *p = big_buffer;
3777 uschar *ss = expand_string(US"$h_subject:");
3778
3779 /* Backslash-quote any double quotes or backslashes so as to make a
3780 a C-like string, and turn any non-printers into escape sequences. */
3781
3782 *p++ = '\"';
3783 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3784 {
3785 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3786 *p++ = ss[i];
3787 }
3788 *p++ = '\"';
3789 *p = 0;
3790 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3791 }
3792
3793/* Terminate the string: string_cat() and string_append() leave room, but do
3794not put the zero in. */
3795
3796s[sptr] = 0;
3797
059ec3d9
PH
3798/* Create a message log file if message logs are being used and this message is
3799not blackholed. Write the reception stuff to it. We used to leave message log
e4bdf652 3800creation until the first delivery, but this has proved confusing for some
059ec3d9
PH
3801people. */
3802
3803if (message_logs && blackholed_by == NULL)
3804 {
3805 int fd;
3806
3807 sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir,
3808 message_id);
3809 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3810
3811 if (fd < 0 && errno == ENOENT)
3812 {
3813 uschar temp[16];
3814 sprintf(CS temp, "msglog/%s", message_subdir);
3815 if (message_subdir[0] == 0) temp[6] = 0;
3816 (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE);
3817 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);