Testsuite: Add DKIM Chunking test
[exim.git] / src / src / receive.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
80fea873 5/* Copyright (c) University of Cambridge 1995 - 2016 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Code for receiving a message and setting up spool files. */
9
059ec3d9
PH
10#include "exim.h"
11
6a8f9482
TK
12#ifdef EXPERIMENTAL_DCC
13extern int dcc_ok;
14#endif
15
4840604e 16#ifdef EXPERIMENTAL_DMARC
c007c974 17# include "dmarc.h"
4840604e
TL
18#endif /* EXPERIMENTAL_DMARC */
19
059ec3d9
PH
20/*************************************************
21* Local static variables *
22*************************************************/
23
24static FILE *data_file = NULL;
25static int data_fd = -1;
41313d92 26static uschar *spool_name = US"";
059ec3d9
PH
27
28
29
30/*************************************************
31* Non-SMTP character reading functions *
32*************************************************/
33
34/* These are the default functions that are set up in the variables such as
35receive_getc initially. They just call the standard functions, passing stdin as
36the file. (When SMTP input is occurring, different functions are used by
37changing the pointer variables.) */
38
39int
40stdin_getc(void)
41{
42return getc(stdin);
43}
44
45int
46stdin_ungetc(int c)
47{
48return ungetc(c, stdin);
49}
50
51int
52stdin_feof(void)
53{
54return feof(stdin);
55}
56
57int
58stdin_ferror(void)
59{
60return ferror(stdin);
61}
62
63
64
65
66/*************************************************
67* Check that a set sender is allowed *
68*************************************************/
69
70/* This function is called when a local caller sets an explicit sender address.
71It checks whether this is permitted, which it is for trusted callers.
72Otherwise, it must match the pattern(s) in untrusted_set_sender.
73
74Arguments: the proposed sender address
75Returns: TRUE for a trusted caller
76 TRUE if the address has been set, untrusted_set_sender has been
77 set, and the address matches something in the list
78 FALSE otherwise
79*/
80
81BOOL
82receive_check_set_sender(uschar *newsender)
83{
84uschar *qnewsender;
85if (trusted_caller) return TRUE;
86if (newsender == NULL || untrusted_set_sender == NULL) return FALSE;
87qnewsender = (Ustrchr(newsender, '@') != NULL)?
88 newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender);
89return
55414b25 90 match_address_list(qnewsender, TRUE, TRUE, CUSS &untrusted_set_sender, NULL, -1,
059ec3d9
PH
91 0, NULL) == OK;
92}
93
94
95
96
97/*************************************************
5cb8cbc6 98* Read space info for a partition *
059ec3d9
PH
99*************************************************/
100
8e669ac1
PH
101/* This function is called by receive_check_fs() below, and also by string
102expansion for variables such as $spool_space. The field names for the statvfs
5cb8cbc6
PH
103structure are macros, because not all OS have F_FAVAIL and it seems tidier to
104have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not
105have inodes, and they return -1 for the number available.
059ec3d9 106
5cb8cbc6
PH
107Later: It turns out that some file systems that do not have the concept of
108inodes return 0 rather than -1. Such systems should also return 0 for the total
8e669ac1 109number of inodes, so we require that to be greater than zero before returning
5cb8cbc6 110an inode count.
059ec3d9 111
5cb8cbc6
PH
112Arguments:
113 isspool TRUE for spool partition, FALSE for log partition
114 inodeptr address of int to receive inode count; -1 if there isn't one
8e669ac1 115
5cb8cbc6 116Returns: available on-root space, in kilobytes
8e669ac1
PH
117 -1 for log partition if there isn't one
118
119All values are -1 if the STATFS functions are not available.
059ec3d9
PH
120*/
121
8e669ac1 122int
5cb8cbc6 123receive_statvfs(BOOL isspool, int *inodeptr)
059ec3d9
PH
124{
125#ifdef HAVE_STATFS
059ec3d9 126struct STATVFS statbuf;
ddf1b11a 127struct stat dummy;
5cb8cbc6
PH
128uschar *path;
129uschar *name;
130uschar buffer[1024];
059ec3d9 131
5cb8cbc6 132/* The spool directory must always exist. */
059ec3d9 133
5cb8cbc6 134if (isspool)
059ec3d9 135 {
8e669ac1
PH
136 path = spool_directory;
137 name = US"spool";
138 }
139
059ec3d9
PH
140/* Need to cut down the log file path to the directory, and to ignore any
141appearance of "syslog" in it. */
142
5cb8cbc6 143else
059ec3d9 144 {
059ec3d9 145 int sep = ':'; /* Not variable - outside scripts use */
55414b25 146 const uschar *p = log_file_path;
8e669ac1 147 name = US"log";
059ec3d9
PH
148
149 /* An empty log_file_path means "use the default". This is the same as an
150 empty item in a list. */
151
152 if (*p == 0) p = US":";
55414b25
JH
153 while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))))
154 if (Ustrcmp(path, "syslog") != 0)
155 break;
059ec3d9 156
5cb8cbc6
PH
157 if (path == NULL) /* No log files */
158 {
8e669ac1
PH
159 *inodeptr = -1;
160 return -1;
161 }
059ec3d9 162
8e669ac1
PH
163 /* An empty string means use the default, which is in the spool directory.
164 But don't just use the spool directory, as it is possible that the log
5cb8cbc6 165 subdirectory has been symbolically linked elsewhere. */
059ec3d9 166
8e669ac1 167 if (path[0] == 0)
059ec3d9 168 {
5cb8cbc6
PH
169 sprintf(CS buffer, CS"%s/log", CS spool_directory);
170 path = buffer;
8e669ac1
PH
171 }
172 else
059ec3d9 173 {
8e669ac1 174 uschar *cp;
5cb8cbc6 175 if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0;
8e669ac1 176 }
5cb8cbc6 177 }
8e669ac1 178
8f128379 179/* We now have the path; do the business */
5cb8cbc6
PH
180
181memset(&statbuf, 0, sizeof(statbuf));
182
183if (STATVFS(CS path, &statbuf) != 0)
ddf1b11a
JH
184 if (stat(CS path, &dummy) == -1 && errno == ENOENT)
185 { /* Can happen on first run after installation */
186 *inodeptr = -1;
187 return -1;
188 }
189 else
190 {
191 log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat "
192 "%s directory %s: %s", name, path, strerror(errno));
193 smtp_closedown(US"spool or log directory problem");
194 exim_exit(EXIT_FAILURE);
195 }
8e669ac1 196
5cb8cbc6
PH
197*inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1;
198
199/* Disks are getting huge. Take care with computing the size in kilobytes. */
8e669ac1 200
5cb8cbc6
PH
201return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0);
202
ddf1b11a 203#else
5cb8cbc6
PH
204/* Unable to find partition sizes in this environment. */
205
5cb8cbc6
PH
206*inodeptr = -1;
207return -1;
208#endif
209}
210
059ec3d9 211
059ec3d9 212
5cb8cbc6
PH
213
214/*************************************************
215* Check space on spool and log partitions *
216*************************************************/
217
218/* This function is called before accepting a message; if any thresholds are
219set, it checks them. If a message_size is supplied, it checks that there is
220enough space for that size plus the threshold - i.e. that the message won't
221reduce the space to the threshold. Not all OS have statvfs(); for those that
222don't, this function always returns TRUE. For some OS the old function and
223struct name statfs is used; that is handled by a macro, defined in exim.h.
224
225Arguments:
226 msg_size the (estimated) size of an incoming message
227
228Returns: FALSE if there isn't enough space, or if the information cannot
229 be obtained
230 TRUE if no check was done or there is enough space
231*/
232
233BOOL
234receive_check_fs(int msg_size)
235{
236int space, inodes;
237
238if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0)
239 {
8e669ac1
PH
240 space = receive_statvfs(TRUE, &inodes);
241
059ec3d9 242 DEBUG(D_receive)
5cb8cbc6
PH
243 debug_printf("spool directory space = %dK inodes = %d "
244 "check_space = %dK inodes = %d msg_size = %d\n",
245 space, inodes, check_spool_space, check_spool_inodes, msg_size);
8e669ac1
PH
246
247 if ((space >= 0 && space < check_spool_space) ||
5cb8cbc6 248 (inodes >= 0 && inodes < check_spool_inodes))
8e669ac1 249 {
5cb8cbc6
PH
250 log_write(0, LOG_MAIN, "spool directory space check failed: space=%d "
251 "inodes=%d", space, inodes);
059ec3d9
PH
252 return FALSE;
253 }
254 }
255
5cb8cbc6
PH
256if (check_log_space > 0 || check_log_inodes > 0)
257 {
8e669ac1
PH
258 space = receive_statvfs(FALSE, &inodes);
259
5cb8cbc6
PH
260 DEBUG(D_receive)
261 debug_printf("log directory space = %dK inodes = %d "
262 "check_space = %dK inodes = %d\n",
263 space, inodes, check_log_space, check_log_inodes);
8e669ac1
PH
264
265 if ((space >= 0 && space < check_log_space) ||
5cb8cbc6 266 (inodes >= 0 && inodes < check_log_inodes))
8e669ac1 267 {
5cb8cbc6
PH
268 log_write(0, LOG_MAIN, "log directory space check failed: space=%d "
269 "inodes=%d", space, inodes);
270 return FALSE;
271 }
8e669ac1
PH
272 }
273
059ec3d9
PH
274return TRUE;
275}
276
277
278
279/*************************************************
280* Bomb out while reading a message *
281*************************************************/
282
283/* The common case of wanting to bomb out is if a SIGTERM or SIGINT is
284received, or if there is a timeout. A rarer case might be if the log files are
285screwed up and Exim can't open them to record a message's arrival. Handling
286that case is done by setting a flag to cause the log functions to call this
287function if there is an ultimate disaster. That is why it is globally
288accessible.
289
8f128379
PH
290Arguments:
291 reason text reason to pass to the not-quit ACL
292 msg default SMTP response to give if in an SMTP session
059ec3d9
PH
293Returns: it doesn't
294*/
295
296void
8f128379 297receive_bomb_out(uschar *reason, uschar *msg)
059ec3d9 298{
ead37e6c
PP
299 static BOOL already_bombing_out;
300/* The smtp_notquit_exit() below can call ACLs which can trigger recursive
301timeouts, if someone has something slow in their quit ACL. Since the only
302things we should be doing are to close down cleanly ASAP, on the second
303pass we also close down stuff that might be opened again, before bypassing
304the ACL call and exiting. */
305
059ec3d9
PH
306/* If spool_name is set, it contains the name of the data file that is being
307written. Unlink it before closing so that it cannot be picked up by a delivery
308process. Ensure that any header file is also removed. */
309
ead37e6c 310if (spool_name[0] != '\0')
059ec3d9
PH
311 {
312 Uunlink(spool_name);
313 spool_name[Ustrlen(spool_name) - 1] = 'H';
314 Uunlink(spool_name);
ead37e6c 315 spool_name[0] = '\0';
059ec3d9
PH
316 }
317
318/* Now close the file if it is open, either as a fd or a stream. */
319
ead37e6c
PP
320if (data_file != NULL)
321 {
322 (void)fclose(data_file);
323 data_file = NULL;
324} else if (data_fd >= 0) {
325 (void)close(data_fd);
326 data_fd = -1;
327 }
059ec3d9 328
8f128379
PH
329/* Attempt to close down an SMTP connection tidily. For non-batched SMTP, call
330smtp_notquit_exit(), which runs the NOTQUIT ACL, if present, and handles the
331SMTP response. */
059ec3d9 332
ead37e6c 333if (!already_bombing_out)
059ec3d9 334 {
ead37e6c
PP
335 already_bombing_out = TRUE;
336 if (smtp_input)
337 {
338 if (smtp_batched_input)
339 moan_smtp_batch(NULL, "421 %s - message abandoned", msg); /* No return */
340 smtp_notquit_exit(reason, US"421", US"%s %s - closing connection.",
341 smtp_active_hostname, msg);
342 }
059ec3d9
PH
343 }
344
345/* Exit from the program (non-BSMTP cases) */
346
347exim_exit(EXIT_FAILURE);
348}
349
350
351/*************************************************
352* Data read timeout *
353*************************************************/
354
355/* Handler function for timeouts that occur while reading the data that
356comprises a message.
357
358Argument: the signal number
359Returns: nothing
360*/
361
362static void
363data_timeout_handler(int sig)
364{
365uschar *msg = NULL;
366
367sig = sig; /* Keep picky compilers happy */
368
369if (smtp_input)
370 {
371 msg = US"SMTP incoming data timeout";
372 log_write(L_lost_incoming_connection,
373 LOG_MAIN, "SMTP data timeout (message abandoned) on connection "
fed77020
PH
374 "from %s F=<%s>",
375 (sender_fullhost != NULL)? sender_fullhost : US"local process",
376 sender_address);
059ec3d9
PH
377 }
378else
379 {
380 fprintf(stderr, "exim: timed out while reading - message abandoned\n");
381 log_write(L_lost_incoming_connection,
382 LOG_MAIN, "timed out while reading local message");
383 }
384
8f128379 385receive_bomb_out(US"data-timeout", msg); /* Does not return */
059ec3d9
PH
386}
387
388
389
390/*************************************************
391* local_scan() timeout *
392*************************************************/
393
394/* Handler function for timeouts that occur while running a local_scan()
395function.
396
397Argument: the signal number
398Returns: nothing
399*/
400
401static void
402local_scan_timeout_handler(int sig)
403{
404sig = sig; /* Keep picky compilers happy */
405log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - "
406 "message temporarily rejected (size %d)", message_size);
8f128379
PH
407/* Does not return */
408receive_bomb_out(US"local-scan-timeout", US"local verification problem");
059ec3d9
PH
409}
410
411
412
413/*************************************************
414* local_scan() crashed *
415*************************************************/
416
417/* Handler function for signals that occur while running a local_scan()
418function.
419
420Argument: the signal number
421Returns: nothing
422*/
423
424static void
425local_scan_crash_handler(int sig)
426{
427log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with "
428 "signal %d - message temporarily rejected (size %d)", sig, message_size);
8f128379
PH
429/* Does not return */
430receive_bomb_out(US"local-scan-error", US"local verification problem");
059ec3d9
PH
431}
432
433
434/*************************************************
435* SIGTERM or SIGINT received *
436*************************************************/
437
438/* Handler for SIGTERM or SIGINT signals that occur while reading the
439data that comprises a message.
440
441Argument: the signal number
442Returns: nothing
443*/
444
445static void
446data_sigterm_sigint_handler(int sig)
447{
448uschar *msg = NULL;
449
450if (smtp_input)
451 {
452 msg = US"Service not available - SIGTERM or SIGINT received";
453 log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(),
454 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
455 }
456else
457 {
f05da2e8 458 if (filter_test == FTEST_NONE)
059ec3d9
PH
459 {
460 fprintf(stderr, "\nexim: %s received - message abandoned\n",
461 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
462 log_write(0, LOG_MAIN, "%s received while reading local message",
463 (sig == SIGTERM)? "SIGTERM" : "SIGINT");
464 }
465 }
466
8f128379 467receive_bomb_out(US"signal-exit", msg); /* Does not return */
059ec3d9
PH
468}
469
470
471
472/*************************************************
473* Add new recipient to list *
474*************************************************/
475
476/* This function builds a list of recipient addresses in argc/argv
477format.
478
479Arguments:
480 recipient the next address to add to recipients_list
481 pno parent number for fixed aliases; -1 otherwise
482
483Returns: nothing
484*/
485
486void
487receive_add_recipient(uschar *recipient, int pno)
488{
489if (recipients_count >= recipients_list_max)
490 {
491 recipient_item *oldlist = recipients_list;
492 int oldmax = recipients_list_max;
493 recipients_list_max = recipients_list_max? 2*recipients_list_max : 50;
494 recipients_list = store_get(recipients_list_max * sizeof(recipient_item));
495 if (oldlist != NULL)
496 memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item));
497 }
498
499recipients_list[recipients_count].address = recipient;
500recipients_list[recipients_count].pno = pno;
8523533c
TK
501#ifdef EXPERIMENTAL_BRIGHTMAIL
502recipients_list[recipients_count].bmi_optin = bmi_current_optin;
503/* reset optin string pointer for next recipient */
504bmi_current_optin = NULL;
505#endif
6c1c3d1d
WB
506recipients_list[recipients_count].orcpt = NULL;
507recipients_list[recipients_count].dsn_flags = 0;
059ec3d9
PH
508recipients_list[recipients_count++].errors_to = NULL;
509}
510
511
512
513
fd98a5c6
JH
514/*************************************************
515* Send user response message *
516*************************************************/
61147df4 517
fd98a5c6
JH
518/* This function is passed a default response code and a user message. It calls
519smtp_message_code() to check and possibly modify the response code, and then
520calls smtp_respond() to transmit the response. I put this into a function
521just to avoid a lot of repetition.
61147df4
PP
522
523Arguments:
fd98a5c6
JH
524 code the response code
525 user_msg the user message
526
527Returns: nothing
61147df4
PP
528*/
529
8ccd00b1 530#ifndef DISABLE_PRDR
61147df4 531static void
fd98a5c6 532smtp_user_msg(uschar *code, uschar *user_msg)
61147df4 533{
fd98a5c6 534int len = 3;
4f6ae5c3 535smtp_message_code(&code, &len, &user_msg, NULL, TRUE);
fd98a5c6 536smtp_respond(code, len, TRUE, user_msg);
61147df4
PP
537}
538#endif
539
540
541
542
fd98a5c6 543
059ec3d9
PH
544/*************************************************
545* Remove a recipient from the list *
546*************************************************/
547
548/* This function is provided for local_scan() to use.
549
550Argument:
551 recipient address to remove
552
553Returns: TRUE if it did remove something; FALSE otherwise
554*/
555
556BOOL
557receive_remove_recipient(uschar *recipient)
558{
559int count;
560DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n",
561 recipient);
562for (count = 0; count < recipients_count; count++)
563 {
564 if (Ustrcmp(recipients_list[count].address, recipient) == 0)
565 {
566 if ((--recipients_count - count) > 0)
567 memmove(recipients_list + count, recipients_list + count + 1,
54cdb463 568 (recipients_count - count)*sizeof(recipient_item));
059ec3d9
PH
569 return TRUE;
570 }
571 }
572return FALSE;
573}
574
575
576
577
578
579/*************************************************
580* Read data portion of a non-SMTP message *
581*************************************************/
582
583/* This function is called to read the remainder of a message (following the
584header) when the input is not from SMTP - we are receiving a local message on
585a standard input stream. The message is always terminated by EOF, and is also
586terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the
587two cases for maximum efficiency.
588
589Ensure that the body ends with a newline. This will naturally be the case when
590the termination is "\n.\n" but may not be otherwise. The RFC defines messages
591as "sequences of lines" - this of course strictly applies only to SMTP, but
592deliveries into BSD-type mailbox files also require it. Exim used to have a
593flag for doing this at delivery time, but as it was always set for all
594transports, I decided to simplify things by putting the check here instead.
595
596There is at least one MUA (dtmail) that sends CRLF via this interface, and
597other programs are known to do this as well. Exim used to have a option for
598dealing with this: in July 2003, after much discussion, the code has been
599changed to default to treat any of LF, CRLF, and bare CR as line terminators.
600
601However, for the case when a dot on a line by itself terminates a message, the
602only recognized terminating sequences before and after the dot are LF and CRLF.
603Otherwise, having read EOL . CR, you don't know whether to read another
604character or not.
605
606Internally, in messages stored in Exim's spool files, LF is used as the line
607terminator. Under the new regime, bare CRs will no longer appear in these
608files.
609
610Arguments:
611 fout a FILE to which to write the message
612
613Returns: One of the END_xxx values indicating why it stopped reading
614*/
615
616static int
617read_message_data(FILE *fout)
618{
619int ch_state;
620register int ch;
d677b2f2 621register int linelength = 0;
059ec3d9
PH
622
623/* Handle the case when only EOF terminates the message */
624
625if (!dot_ends)
626 {
627 register int last_ch = '\n';
628
80a47a2c 629 for (; (ch = (receive_getc)()) != EOF; last_ch = ch)
059ec3d9
PH
630 {
631 if (ch == 0) body_zerocount++;
632 if (last_ch == '\r' && ch != '\n')
633 {
d677b2f2
PH
634 if (linelength > max_received_linelength)
635 max_received_linelength = linelength;
636 linelength = 0;
059ec3d9
PH
637 if (fputc('\n', fout) == EOF) return END_WERROR;
638 message_size++;
639 body_linecount++;
640 }
641 if (ch == '\r') continue;
642
643 if (fputc(ch, fout) == EOF) return END_WERROR;
d677b2f2
PH
644 if (ch == '\n')
645 {
646 if (linelength > max_received_linelength)
647 max_received_linelength = linelength;
648 linelength = 0;
649 body_linecount++;
650 }
651 else linelength++;
059ec3d9
PH
652 if (++message_size > thismessage_size_limit) return END_SIZE;
653 }
654
655 if (last_ch != '\n')
656 {
d677b2f2
PH
657 if (linelength > max_received_linelength)
658 max_received_linelength = linelength;
059ec3d9
PH
659 if (fputc('\n', fout) == EOF) return END_WERROR;
660 message_size++;
661 body_linecount++;
662 }
663
664 return END_EOF;
665 }
666
667/* Handle the case when a dot on a line on its own, or EOF, terminates. */
668
669ch_state = 1;
670
80a47a2c 671while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
672 {
673 if (ch == 0) body_zerocount++;
674 switch (ch_state)
675 {
676 case 0: /* Normal state (previous char written) */
677 if (ch == '\n')
d677b2f2
PH
678 {
679 body_linecount++;
680 if (linelength > max_received_linelength)
681 max_received_linelength = linelength;
682 linelength = -1;
683 ch_state = 1;
684 }
059ec3d9
PH
685 else if (ch == '\r')
686 { ch_state = 2; continue; }
687 break;
688
689 case 1: /* After written "\n" */
690 if (ch == '.') { ch_state = 3; continue; }
6eb02f88 691 if (ch == '\r') { ch_state = 2; continue; }
3581f321
JH
692 if (ch == '\n') { body_linecount++; linelength = -1; }
693 else ch_state = 0;
059ec3d9
PH
694 break;
695
696 case 2:
697 body_linecount++; /* After unwritten "\r" */
d677b2f2
PH
698 if (linelength > max_received_linelength)
699 max_received_linelength = linelength;
059ec3d9 700 if (ch == '\n')
d677b2f2
PH
701 {
702 ch_state = 1;
703 linelength = -1;
704 }
059ec3d9
PH
705 else
706 {
707 if (message_size++, fputc('\n', fout) == EOF) return END_WERROR;
708 if (ch == '\r') continue;
709 ch_state = 0;
d677b2f2 710 linelength = 0;
059ec3d9
PH
711 }
712 break;
713
714 case 3: /* After "\n." (\n written, dot not) */
715 if (ch == '\n') return END_DOT;
716 if (ch == '\r') { ch_state = 4; continue; }
717 message_size++;
d677b2f2 718 linelength++;
059ec3d9
PH
719 if (fputc('.', fout) == EOF) return END_WERROR;
720 ch_state = 0;
721 break;
722
723 case 4: /* After "\n.\r" (\n written, rest not) */
724 if (ch == '\n') return END_DOT;
725 message_size += 2;
726 body_linecount++;
727 if (fputs(".\n", fout) == EOF) return END_WERROR;
728 if (ch == '\r') { ch_state = 2; continue; }
729 ch_state = 0;
730 break;
731 }
732
d677b2f2 733 linelength++;
059ec3d9
PH
734 if (fputc(ch, fout) == EOF) return END_WERROR;
735 if (++message_size > thismessage_size_limit) return END_SIZE;
736 }
737
738/* Get here if EOF read. Unless we have just written "\n", we need to ensure
739the message ends with a newline, and we must also write any characters that
740were saved up while testing for an ending dot. */
741
742if (ch_state != 1)
743 {
744 static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" };
745 if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR;
746 message_size += Ustrlen(ends[ch_state]);
747 body_linecount++;
748 }
749
750return END_EOF;
751}
752
753
754
755
756/*************************************************
757* Read data portion of an SMTP message *
758*************************************************/
759
760/* This function is called to read the remainder of an SMTP message (after the
761headers), or to skip over it when an error has occurred. In this case, the
762output file is passed as NULL.
763
764If any line begins with a dot, that character is skipped. The input should only
765be successfully terminated by CR LF . CR LF unless it is local (non-network)
766SMTP, in which case the CRs are optional, but...
767
768FUDGE: It seems that sites on the net send out messages with just LF
769terminators, despite the warnings in the RFCs, and other MTAs handle this. So
770we make the CRs optional in all cases.
771
772July 2003: Bare CRs cause trouble. We now treat them as line terminators as
773well, so that there are no CRs in spooled messages. However, the message
774terminating dot is not recognized between two bare CRs.
775
776Arguments:
777 fout a FILE to which to write the message; NULL if skipping
778
779Returns: One of the END_xxx values indicating why it stopped reading
780*/
781
782static int
783read_message_data_smtp(FILE *fout)
784{
785int ch_state = 0;
e4bdf652 786int ch;
7e3ce68e 787int linelength = 0;
059ec3d9 788
80a47a2c 789while ((ch = (receive_getc)()) != EOF)
059ec3d9
PH
790 {
791 if (ch == 0) body_zerocount++;
792 switch (ch_state)
793 {
794 case 0: /* After LF or CRLF */
795 if (ch == '.')
796 {
797 ch_state = 3;
798 continue; /* Don't ever write . after LF */
799 }
800 ch_state = 1;
801
802 /* Else fall through to handle as normal uschar. */
803
804 case 1: /* Normal state */
805 if (ch == '\n')
806 {
807 ch_state = 0;
808 body_linecount++;
1f5497b2
PH
809 if (linelength > max_received_linelength)
810 max_received_linelength = linelength;
811 linelength = -1;
059ec3d9
PH
812 }
813 else if (ch == '\r')
814 {
815 ch_state = 2;
816 continue;
817 }
818 break;
819
820 case 2: /* After (unwritten) CR */
821 body_linecount++;
1f5497b2
PH
822 if (linelength > max_received_linelength)
823 max_received_linelength = linelength;
824 linelength = -1;
059ec3d9
PH
825 if (ch == '\n')
826 {
827 ch_state = 0;
828 }
829 else
830 {
831 message_size++;
832 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 833 (void) cutthrough_put_nl();
059ec3d9
PH
834 if (ch != '\r') ch_state = 1; else continue;
835 }
836 break;
837
838 case 3: /* After [CR] LF . */
839 if (ch == '\n')
840 return END_DOT;
841 if (ch == '\r')
842 {
843 ch_state = 4;
844 continue;
845 }
1bc460a6
JH
846 /* The dot was removed at state 3. For a doubled dot, here, reinstate
847 it to cutthrough. The current ch, dot or not, is passed both to cutthrough
848 and to file below. */
849 if (ch == '.')
850 {
851 uschar c= ch;
852 (void) cutthrough_puts(&c, 1);
853 }
854 ch_state = 1;
059ec3d9
PH
855 break;
856
857 case 4: /* After [CR] LF . CR */
858 if (ch == '\n') return END_DOT;
859 message_size++;
860 body_linecount++;
861 if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR;
e4bdf652 862 (void) cutthrough_put_nl();
059ec3d9
PH
863 if (ch == '\r')
864 {
865 ch_state = 2;
866 continue;
867 }
868 ch_state = 1;
869 break;
870 }
871
872 /* Add the character to the spool file, unless skipping; then loop for the
873 next. */
874
875 message_size++;
1f5497b2 876 linelength++;
7e3ce68e 877 if (fout)
059ec3d9
PH
878 {
879 if (fputc(ch, fout) == EOF) return END_WERROR;
880 if (message_size > thismessage_size_limit) return END_SIZE;
881 }
e4bdf652
JH
882 if(ch == '\n')
883 (void) cutthrough_put_nl();
884 else
885 {
7e3ce68e 886 uschar c = ch;
e4bdf652
JH
887 (void) cutthrough_puts(&c, 1);
888 }
059ec3d9
PH
889 }
890
891/* Fall through here if EOF encountered. This indicates some kind of error,
892since a correct message is terminated by [CR] LF . [CR] LF. */
893
894return END_EOF;
895}
896
897
898
899
7e3ce68e
JH
900/* Variant of the above read_message_data_smtp() specialised for RFC 3030
901CHUNKING. We assume that the incoming has proper CRLF, so only have to scan
902for and strip CR. On the downside there are more protocol reasons to stop.
903
904Arguments:
905 fout a FILE to which to write the message; NULL if skipping
906
907Returns: One of the END_xxx values indicating why it stopped reading
908*/
909
910static int
911read_message_bdat_smtp(FILE *fout)
912{
913int ch;
914int linelength = 0;
915
916for (;;) switch (ch = bdat_getc())
917 {
918 case EOF: return END_EOF;
919 case EOD: return END_DOT;
920 case ERR: return END_PROTOCOL;
921
922 case '\r':
923 body_linecount++;
924 if (linelength > max_received_linelength)
925 max_received_linelength = linelength;
926 linelength = -1;
927 break;
928
929 case 0:
930 body_zerocount++;
931 /*FALLTHROUGH*/
932 default:
933 message_size++;
934 linelength++;
935 if (fout)
936 {
937 if (fputc(ch, fout) == EOF) return END_WERROR;
938 if (message_size > thismessage_size_limit) return END_SIZE;
939 }
940#ifdef notyet
941 if(ch == '\n')
942 (void) cutthrough_put_nl();
943 else
944 {
945 uschar c = ch;
946 (void) cutthrough_puts(&c, 1);
947 }
948#endif
949 break;
950 }
951/*NOTREACHED*/
952}
953
954
955
956
059ec3d9
PH
957/*************************************************
958* Swallow SMTP message *
959*************************************************/
960
961/* This function is called when there has been some kind of error while reading
962an SMTP message, and the remaining data may need to be swallowed. It is global
963because it is called from smtp_closedown() to shut down an incoming call
964tidily.
965
966Argument: a FILE from which to read the message
967Returns: nothing
968*/
969
970void
971receive_swallow_smtp(void)
972{
7e3ce68e 973/*XXX CHUNKING: not enough. read chunks until RSET? */
059ec3d9
PH
974if (message_ended >= END_NOTENDED)
975 message_ended = read_message_data_smtp(NULL);
976}
977
978
979
980/*************************************************
981* Handle lost SMTP connection *
982*************************************************/
983
984/* This function logs connection loss incidents and generates an appropriate
985SMTP response.
986
987Argument: additional data for the message
988Returns: the SMTP response
989*/
990
991static uschar *
992handle_lost_connection(uschar *s)
993{
994log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN,
995 "%s lost while reading message data%s", smtp_get_connection_info(), s);
eea0defe 996smtp_notquit_exit(US"connection-lost", NULL, NULL);
059ec3d9
PH
997return US"421 Lost incoming connection";
998}
999
1000
1001
1002
1003/*************************************************
1004* Handle a non-smtp reception error *
1005*************************************************/
1006
1007/* This function is called for various errors during the reception of non-SMTP
1008messages. It either sends a message to the sender of the problem message, or it
1009writes to the standard error stream.
1010
1011Arguments:
1012 errcode code for moan_to_sender(), identifying the error
1013 text1 first message text, passed to moan_to_sender()
1014 text2 second message text, used only for stderrr
1015 error_rc code to pass to exim_exit if no problem
1016 f FILE containing body of message (may be stdin)
1017 hptr pointer to instore headers or NULL
1018
1019Returns: calls exim_exit(), which does not return
1020*/
1021
1022static void
1023give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc,
1024 FILE *f, header_line *hptr)
1025{
1026if (error_handling == ERRORS_SENDER)
1027 {
1028 error_block eblock;
1029 eblock.next = NULL;
1030 eblock.text1 = text1;
37f3dc43 1031 eblock.text2 = US"";
059ec3d9
PH
1032 if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE))
1033 error_rc = EXIT_FAILURE;
1034 }
37f3dc43
JH
1035else
1036 fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */
f1e894f3 1037(void)fclose(f);
059ec3d9
PH
1038exim_exit(error_rc);
1039}
1040
1041
1042
1043/*************************************************
1044* Add header lines set up by ACL *
1045*************************************************/
1046
850635b6
PH
1047/* This function is called to add the header lines that were set up by
1048statements in an ACL to the list of headers in memory. It is done in two stages
1049like this, because when the ACL for RCPT is running, the other headers have not
1050yet been received. This function is called twice; once just before running the
1051DATA ACL, and once after. This is so that header lines added by MAIL or RCPT
1052are visible to the DATA ACL.
059ec3d9
PH
1053
1054Originally these header lines were added at the end. Now there is support for
1055three different places: top, bottom, and after the Received: header(s). There
1056will always be at least one Received: header, even if it is marked deleted, and
1057even if something else has been put in front of it.
1058
1059Arguments:
1060 acl_name text to identify which ACL
1061
1062Returns: nothing
1063*/
1064
1065static void
578d43dc 1066add_acl_headers(int where, uschar *acl_name)
059ec3d9
PH
1067{
1068header_line *h, *next;
1069header_line *last_received = NULL;
e7568d51 1070
578d43dc
JH
1071switch(where)
1072 {
1073 case ACL_WHERE_DKIM:
1074 case ACL_WHERE_MIME:
af4a1bca 1075 case ACL_WHERE_DATA:
5032d1cf 1076 if (cutthrough.fd >= 0 && (acl_removed_headers || acl_added_headers))
578d43dc
JH
1077 {
1078 log_write(0, LOG_MAIN|LOG_PANIC, "Header modification in data ACLs"
af4a1bca 1079 " will not take effect on cutthrough deliveries");
578d43dc
JH
1080 return;
1081 }
1082 }
1083
e7568d51
TL
1084if (acl_removed_headers != NULL)
1085 {
1086 DEBUG(D_receive|D_acl) debug_printf(">>Headers removed by %s ACL:\n", acl_name);
1087
4a142059 1088 for (h = header_list; h != NULL; h = h->next) if (h->type != htype_old)
e7568d51 1089 {
55414b25 1090 const uschar * list = acl_removed_headers;
e7568d51
TL
1091 int sep = ':'; /* This is specified as a colon-separated list */
1092 uschar *s;
1093 uschar buffer[128];
4a142059
JH
1094
1095 while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer))))
1096 if (header_testname(h, s, Ustrlen(s), FALSE))
e7568d51
TL
1097 {
1098 h->type = htype_old;
1099 DEBUG(D_receive|D_acl) debug_printf(" %s", h->text);
1100 }
e7568d51
TL
1101 }
1102 acl_removed_headers = NULL;
1103 DEBUG(D_receive|D_acl) debug_printf(">>\n");
1104 }
059ec3d9 1105
71fafd95 1106if (acl_added_headers == NULL) return;
059ec3d9
PH
1107DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name);
1108
71fafd95 1109for (h = acl_added_headers; h != NULL; h = next)
059ec3d9
PH
1110 {
1111 next = h->next;
1112
1113 switch(h->type)
1114 {
1115 case htype_add_top:
1116 h->next = header_list;
1117 header_list = h;
1118 DEBUG(D_receive|D_acl) debug_printf(" (at top)");
1119 break;
1120
1121 case htype_add_rec:
1122 if (last_received == NULL)
1123 {
1124 last_received = header_list;
1125 while (!header_testname(last_received, US"Received", 8, FALSE))
1126 last_received = last_received->next;
1127 while (last_received->next != NULL &&
1128 header_testname(last_received->next, US"Received", 8, FALSE))
1129 last_received = last_received->next;
1130 }
1131 h->next = last_received->next;
1132 last_received->next = h;
1133 DEBUG(D_receive|D_acl) debug_printf(" (after Received:)");
1134 break;
1135
8523533c
TK
1136 case htype_add_rfc:
1137 /* add header before any header which is NOT Received: or Resent- */
1138 last_received = header_list;
1139 while ( (last_received->next != NULL) &&
1140 ( (header_testname(last_received->next, US"Received", 8, FALSE)) ||
1141 (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) )
1142 last_received = last_received->next;
1143 /* last_received now points to the last Received: or Resent-* header
1144 in an uninterrupted chain of those header types (seen from the beginning
1145 of all headers. Our current header must follow it. */
1146 h->next = last_received->next;
1147 last_received->next = h;
8e669ac1 1148 DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)");
8523533c
TK
1149 break;
1150
059ec3d9
PH
1151 default:
1152 h->next = NULL;
1153 header_last->next = h;
1154 break;
1155 }
1156
1157 if (h->next == NULL) header_last = h;
1158
1159 /* Check for one of the known header types (From:, To:, etc.) though in
1160 practice most added headers are going to be "other". Lower case
1161 identification letters are never stored with the header; they are used
1162 for existence tests when messages are received. So discard any lower case
1163 flag values. */
1164
1165 h->type = header_checkname(h, FALSE);
1166 if (h->type >= 'a') h->type = htype_other;
1167
1168 DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text);
1169 }
1170
71fafd95 1171acl_added_headers = NULL;
059ec3d9
PH
1172DEBUG(D_receive|D_acl) debug_printf(">>\n");
1173}
1174
1175
1176
1177/*************************************************
1178* Add host information for log line *
1179*************************************************/
1180
1181/* Called for acceptance and rejecting log lines. This adds information about
1182the calling host to a string that is being built dynamically.
1183
1184Arguments:
1185 s the dynamic string
1186 sizeptr points to the size variable
1187 ptrptr points to the pointer variable
1188
1189Returns: the extended string
1190*/
1191
1192static uschar *
fc16abb4 1193add_host_info_for_log(uschar * s, int * sizeptr, int * ptrptr)
059ec3d9 1194{
fc16abb4 1195if (sender_fullhost)
059ec3d9 1196 {
fc16abb4
JH
1197 if (LOGGING(dnssec) && sender_host_dnssec) /*XXX sender_helo_dnssec? */
1198 s = string_cat(s, sizeptr, ptrptr, US" DS");
059ec3d9 1199 s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost);
6c6d6e48 1200 if (LOGGING(incoming_interface) && interface_address != NULL)
059ec3d9 1201 {
fc16abb4
JH
1202 s = string_cat(s, sizeptr, ptrptr,
1203 string_sprintf(" I=[%s]:%d", interface_address, interface_port));
059ec3d9
PH
1204 }
1205 }
1206if (sender_ident != NULL)
1207 s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident);
1208if (received_protocol != NULL)
1209 s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol);
1210return s;
1211}
1212
1213
1214
63955bf2 1215#ifdef WITH_CONTENT_SCAN
059ec3d9 1216
54cdb463
PH
1217/*************************************************
1218* Run the MIME ACL on a message *
1219*************************************************/
1220
1221/* This code is in a subroutine so that it can be used for both SMTP
1222and non-SMTP messages. It is called with a non-NULL ACL pointer.
1223
1224Arguments:
1225 acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime)
1226 smtp_yield_ptr Set FALSE to kill messages after dropped connection
1227 smtp_reply_ptr Where SMTP reply is being built
1228 blackholed_by_ptr Where "blackholed by" message is being built
1229
1230Returns: TRUE to carry on; FALSE to abandon the message
1231*/
1232
1233static BOOL
1234run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr,
1235 uschar **blackholed_by_ptr)
1236{
1237FILE *mbox_file;
1238uschar rfc822_file_path[2048];
1239unsigned long mbox_size;
1240header_line *my_headerlist;
1241uschar *user_msg, *log_msg;
1242int mime_part_count_buffer = -1;
7156b1ef 1243int rc = OK;
54cdb463
PH
1244
1245memset(CS rfc822_file_path,0,2048);
1246
1247/* check if it is a MIME message */
1248my_headerlist = header_list;
4e88a19f
PH
1249while (my_headerlist != NULL)
1250 {
54cdb463 1251 /* skip deleted headers */
4e88a19f
PH
1252 if (my_headerlist->type == '*')
1253 {
54cdb463
PH
1254 my_headerlist = my_headerlist->next;
1255 continue;
4e88a19f
PH
1256 }
1257 if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0)
1258 {
54cdb463
PH
1259 DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n");
1260 goto DO_MIME_ACL;
4e88a19f 1261 }
54cdb463 1262 my_headerlist = my_headerlist->next;
4e88a19f 1263 }
54cdb463
PH
1264
1265DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n");
1266return TRUE;
1267
1268DO_MIME_ACL:
1269/* make sure the eml mbox file is spooled up */
8544e77a 1270mbox_file = spool_mbox(&mbox_size, NULL);
54cdb463
PH
1271if (mbox_file == NULL) {
1272 /* error while spooling */
1273 log_write(0, LOG_MAIN|LOG_PANIC,
1274 "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected.");
1275 Uunlink(spool_name);
1276 unspool_mbox();
6f0c431a
PP
1277#ifdef EXPERIMENTAL_DCC
1278 dcc_ok = 0;
1279#endif
a5bd321b 1280 smtp_respond(US"451", 3, TRUE, US"temporary local problem");
54cdb463
PH
1281 message_id[0] = 0; /* Indicate no message accepted */
1282 *smtp_reply_ptr = US""; /* Indicate reply already sent */
1283 return FALSE; /* Indicate skip to end of receive function */
1284};
1285
1286mime_is_rfc822 = 0;
1287
1288MIME_ACL_CHECK:
1289mime_part_count = -1;
1290rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg);
f1e894f3 1291(void)fclose(mbox_file);
54cdb463 1292
4e88a19f
PH
1293if (Ustrlen(rfc822_file_path) > 0)
1294 {
54cdb463
PH
1295 mime_part_count = mime_part_count_buffer;
1296
4e88a19f
PH
1297 if (unlink(CS rfc822_file_path) == -1)
1298 {
54cdb463
PH
1299 log_write(0, LOG_PANIC,
1300 "acl_smtp_mime: can't unlink RFC822 spool file, skipping.");
1301 goto END_MIME_ACL;
4e88a19f
PH
1302 }
1303 }
54cdb463
PH
1304
1305/* check if we must check any message/rfc822 attachments */
4e88a19f
PH
1306if (rc == OK)
1307 {
54cdb463 1308 uschar temp_path[1024];
e8bc7fca
JH
1309 struct dirent * entry;
1310 DIR * tempdir;
54cdb463 1311
e8bc7fca
JH
1312 (void) string_format(temp_path, sizeof(temp_path), "%s/scan/%s",
1313 spool_directory, message_id);
54cdb463 1314
4e88a19f 1315 tempdir = opendir(CS temp_path);
e8bc7fca 1316 for (;;)
4e88a19f 1317 {
e8bc7fca
JH
1318 if (!(entry = readdir(tempdir)))
1319 break;
1320 if (strncmpic(US entry->d_name, US"__rfc822_", 9) == 0)
4e88a19f 1321 {
e8bc7fca
JH
1322 (void) string_format(rfc822_file_path, sizeof(rfc822_file_path),
1323 "%s/scan/%s/%s", spool_directory, message_id, entry->d_name);
1324 debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n",
1325 rfc822_file_path);
4e88a19f
PH
1326 break;
1327 }
e8bc7fca 1328 }
4e88a19f 1329 closedir(tempdir);
54cdb463 1330
e8bc7fca 1331 if (entry)
4e88a19f 1332 {
e8bc7fca 1333 if ((mbox_file = Ufopen(rfc822_file_path, "rb")))
4e88a19f 1334 {
e8bc7fca
JH
1335 /* set RFC822 expansion variable */
1336 mime_is_rfc822 = 1;
1337 mime_part_count_buffer = mime_part_count;
1338 goto MIME_ACL_CHECK;
4e88a19f 1339 }
e8bc7fca
JH
1340 log_write(0, LOG_PANIC,
1341 "acl_smtp_mime: can't open RFC822 spool file, skipping.");
1342 unlink(CS rfc822_file_path);
4e88a19f
PH
1343 }
1344 }
54cdb463
PH
1345
1346END_MIME_ACL:
578d43dc 1347add_acl_headers(ACL_WHERE_MIME, US"MIME");
54cdb463
PH
1348if (rc == DISCARD)
1349 {
1350 recipients_count = 0;
1351 *blackholed_by_ptr = US"MIME ACL";
1352 }
1353else if (rc != OK)
1354 {
1355 Uunlink(spool_name);
1356 unspool_mbox();
6f0c431a
PP
1357#ifdef EXPERIMENTAL_DCC
1358 dcc_ok = 0;
1359#endif
4f6ae5c3
JH
1360 if ( smtp_input
1361 && smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0)
1362 {
85ffcba6 1363 *smtp_yield_ptr = FALSE; /* No more messages after dropped connection */
f4c1088b 1364 *smtp_reply_ptr = US""; /* Indicate reply already sent */
4f6ae5c3 1365 }
54cdb463
PH
1366 message_id[0] = 0; /* Indicate no message accepted */
1367 return FALSE; /* Cause skip to end of receive function */
4e88a19f 1368 }
54cdb463
PH
1369
1370return TRUE;
1371}
1372
63955bf2 1373#endif /* WITH_CONTENT_SCAN */
54cdb463
PH
1374
1375
e4bdf652
JH
1376
1377void
1378received_header_gen(void)
1379{
1380uschar *received;
1381uschar *timestamp;
1382header_line *received_header= header_list;
1383
1384timestamp = expand_string(US"${tod_full}");
1385if (recipients_count == 1) received_for = recipients_list[0].address;
1386received = expand_string(received_header_text);
1387received_for = NULL;
1388
d4ff61d1 1389if (!received)
e4bdf652
JH
1390 {
1391 if(spool_name[0] != 0)
1392 Uunlink(spool_name); /* Lose the data file */
1393 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" "
1394 "(received_header_text) failed: %s", string_printing(received_header_text),
1395 expand_string_message);
1396 }
1397
1398/* The first element on the header chain is reserved for the Received header,
1399so all we have to do is fill in the text pointer, and set the type. However, if
1400the result of the expansion is an empty string, we leave the header marked as
1401"old" so as to refrain from adding a Received header. */
1402
1403if (received[0] == 0)
1404 {
1405 received_header->text = string_sprintf("Received: ; %s\n", timestamp);
1406 received_header->type = htype_old;
1407 }
1408else
1409 {
1410 received_header->text = string_sprintf("%s; %s\n", received, timestamp);
1411 received_header->type = htype_received;
1412 }
1413
1414received_header->slen = Ustrlen(received_header->text);
1415
1416DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s",
1417 received_header->type, received_header->text);
1418}
1419
1420
1421
059ec3d9
PH
1422/*************************************************
1423* Receive message *
1424*************************************************/
1425
1426/* Receive a message on the given input, and put it into a pair of spool files.
1427Either a non-null list of recipients, or the extract flag will be true, or
1428both. The flag sender_local is true for locally generated messages. The flag
1429submission_mode is true if an ACL has obeyed "control = submission". The flag
8800895a 1430suppress_local_fixups is true if an ACL has obeyed "control =
f4ee74ac
PP
1431suppress_local_fixups" or -G was passed on the command-line.
1432The flag smtp_input is true if the message is to be
8800895a
PH
1433handled using SMTP conventions about termination and lines starting with dots.
1434For non-SMTP messages, dot_ends is true for dot-terminated messages.
059ec3d9
PH
1435
1436If a message was successfully read, message_id[0] will be non-zero.
1437
1438The general actions of this function are:
1439
1440 . Read the headers of the message (if any) into a chain of store
1441 blocks.
1442
1443 . If there is a "sender:" header and the message is locally originated,
69358f02
PH
1444 throw it away, unless the caller is trusted, or unless
1445 active_local_sender_retain is set - which can only happen if
1446 active_local_from_check is false.
059ec3d9
PH
1447
1448 . If recipients are to be extracted from the message, build the
1449 recipients list from the headers, removing any that were on the
1450 original recipients list (unless extract_addresses_remove_arguments is
1451 false), and at the same time, remove any bcc header that may be present.
1452
1453 . Get the spool file for the data, sort out its unique name, open
1454 and lock it (but don't give it the name yet).
1455
1456 . Generate a "Message-Id" header if the message doesn't have one, for
1457 locally-originated messages.
1458
1459 . Generate a "Received" header.
1460
1461 . Ensure the recipients list is fully qualified and rewritten if necessary.
1462
1463 . If there are any rewriting rules, apply them to the sender address
1464 and also to the headers.
1465
1466 . If there is no from: header, generate one, for locally-generated messages
1467 and messages in "submission mode" only.
1468
1469 . If the sender is local, check that from: is correct, and if not, generate
1470 a Sender: header, unless message comes from a trusted caller, or this
69358f02 1471 feature is disabled by active_local_from_check being false.
059ec3d9
PH
1472
1473 . If there is no "date" header, generate one, for locally-originated
1474 or submission mode messages only.
1475
1476 . Copy the rest of the input, or up to a terminating "." if in SMTP or
1477 dot_ends mode, to the data file. Leave it open, to hold the lock.
1478
1479 . Write the envelope and the headers to a new file.
1480
1481 . Set the name for the header file; close it.
1482
1483 . Set the name for the data file; close it.
1484
1485Because this function can potentially be called many times in a single
1486SMTP connection, all store should be got by store_get(), so that it will be
1487automatically retrieved after the message is accepted.
1488
1489FUDGE: It seems that sites on the net send out messages with just LF
1490terminators, despite the warnings in the RFCs, and other MTAs handle this. So
1491we make the CRs optional in all cases.
1492
1493July 2003: Bare CRs in messages, especially in header lines, cause trouble. A
1494new regime is now in place in which bare CRs in header lines are turned into LF
1495followed by a space, so as not to terminate the header line.
1496
1497February 2004: A bare LF in a header line in a message whose first line was
1498terminated by CRLF is treated in the same way as a bare CR.
1499
1500Arguments:
1501 extract_recip TRUE if recipients are to be extracted from the message's
1502 headers
1503
1504Returns: TRUE there are more messages to be read (SMTP input)
1505 FALSE there are no more messages to be read (non-SMTP input
1506 or SMTP connection collapsed, or other failure)
1507
1508When reading a message for filter testing, the returned value indicates
1509whether the headers (which is all that is read) were terminated by '.' or
1510not. */
1511
1512BOOL
1513receive_msg(BOOL extract_recip)
1514{
7156b1ef
NM
1515int i;
1516int rc = FAIL;
059ec3d9
PH
1517int msg_size = 0;
1518int process_info_len = Ustrlen(process_info);
1519int error_rc = (error_handling == ERRORS_SENDER)?
1520 errors_sender_rc : EXIT_FAILURE;
1521int header_size = 256;
1522int start, end, domain, size, sptr;
1523int id_resolution;
1524int had_zero = 0;
d677b2f2 1525int prevlines_length = 0;
059ec3d9
PH
1526
1527register int ptr = 0;
1528
1529BOOL contains_resent_headers = FALSE;
1530BOOL extracted_ignored = FALSE;
1531BOOL first_line_ended_crlf = TRUE_UNSET;
1532BOOL smtp_yield = TRUE;
1533BOOL yield = FALSE;
1534
1535BOOL resents_exist = FALSE;
1536uschar *resent_prefix = US"";
1537uschar *blackholed_by = NULL;
04f7d5b9 1538uschar *blackhole_log_msg = US"";
c5430c20 1539enum {NOT_TRIED, TMP_REJ, PERM_REJ, ACCEPTED} cutthrough_done = NOT_TRIED;
059ec3d9
PH
1540
1541flock_t lock_data;
1542error_block *bad_addresses = NULL;
1543
1544uschar *frozen_by = NULL;
1545uschar *queued_by = NULL;
1546
1547uschar *errmsg, *s;
1548struct stat statbuf;
1549
4e88a19f 1550/* Final message to give to SMTP caller, and messages from ACLs */
059ec3d9
PH
1551
1552uschar *smtp_reply = NULL;
4e88a19f 1553uschar *user_msg, *log_msg;
059ec3d9
PH
1554
1555/* Working header pointers */
1556
1557header_line *h, *next;
1558
2cbb4081 1559/* Flags for noting the existence of certain headers (only one left) */
059ec3d9
PH
1560
1561BOOL date_header_exists = FALSE;
1562
1563/* Pointers to receive the addresses of headers whose contents we need. */
1564
1565header_line *from_header = NULL;
1566header_line *subject_header = NULL;
1567header_line *msgid_header = NULL;
1568header_line *received_header;
1569
4840604e
TL
1570#ifdef EXPERIMENTAL_DMARC
1571int dmarc_up = 0;
1572#endif /* EXPERIMENTAL_DMARC */
1573
059ec3d9
PH
1574/* Variables for use when building the Received: header. */
1575
059ec3d9
PH
1576uschar *timestamp;
1577int tslen;
1578
1579/* Release any open files that might have been cached while preparing to
1580accept the message - e.g. by verifying addresses - because reading a message
1581might take a fair bit of real time. */
1582
1583search_tidyup();
1584
e4bdf652
JH
1585/* Extracting the recipient list from an input file is incompatible with
1586cutthrough delivery with the no-spool option. It shouldn't be possible
817d9f57 1587to set up the combination, but just in case kill any ongoing connection. */
e4bdf652 1588if (extract_recip || !smtp_input)
2e5b33cd 1589 cancel_cutthrough_connection("not smtp input");
e4bdf652 1590
059ec3d9
PH
1591/* Initialize the chain of headers by setting up a place-holder for Received:
1592header. Temporarily mark it as "old", i.e. not to be used. We keep header_last
1593pointing to the end of the chain to make adding headers simple. */
1594
1595received_header = header_list = header_last = store_get(sizeof(header_line));
1596header_list->next = NULL;
1597header_list->type = htype_old;
1598header_list->text = NULL;
1599header_list->slen = 0;
1600
1601/* Control block for the next header to be read. */
1602
1603next = store_get(sizeof(header_line));
1604next->text = store_get(header_size);
1605
1606/* Initialize message id to be null (indicating no message read), and the
1607header names list to be the normal list. Indicate there is no data file open
1608yet, initialize the size and warning count, and deal with no size limit. */
1609
1610message_id[0] = 0;
1611data_file = NULL;
1612data_fd = -1;
41313d92 1613spool_name = US"";
059ec3d9
PH
1614message_size = 0;
1615warning_count = 0;
d677b2f2 1616received_count = 1; /* For the one we will add */
059ec3d9
PH
1617
1618if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX;
1619
2e0c1448 1620/* While reading the message, the following counts are computed. */
059ec3d9 1621
d677b2f2
PH
1622message_linecount = body_linecount = body_zerocount =
1623 max_received_linelength = 0;
059ec3d9 1624
80a47a2c 1625#ifndef DISABLE_DKIM
e983e85a
JH
1626/* Call into DKIM to set up the context. In CHUNKING mode
1627we clear the dot-stuffing flag */
1628if (smtp_input && !smtp_batched_input && !dkim_disable_verify)
1629 dkim_exim_verify_init(chunking_state <= CHUNKING_OFFERED);
fb2274d4
TK
1630#endif
1631
4840604e
TL
1632#ifdef EXPERIMENTAL_DMARC
1633/* initialize libopendmarc */
1634dmarc_up = dmarc_init();
1635#endif
1636
059ec3d9
PH
1637/* Remember the time of reception. Exim uses time+pid for uniqueness of message
1638ids, and fractions of a second are required. See the comments that precede the
1639message id creation below. */
1640
1641(void)gettimeofday(&message_id_tv, NULL);
1642
1643/* For other uses of the received time we can operate with granularity of one
1644second, and for that we use the global variable received_time. This is for
1645things like ultimate message timeouts. */
1646
1647received_time = message_id_tv.tv_sec;
1648
1649/* If SMTP input, set the special handler for timeouts. The alarm() calls
1650happen in the smtp_getc() function when it refills its buffer. */
1651
1652if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler);
1653
1654/* If not SMTP input, timeout happens only if configured, and we just set a
1655single timeout for the whole message. */
1656
1657else if (receive_timeout > 0)
1658 {
1659 os_non_restarting_signal(SIGALRM, data_timeout_handler);
1660 alarm(receive_timeout);
1661 }
1662
1663/* SIGTERM and SIGINT are caught always. */
1664
1665signal(SIGTERM, data_sigterm_sigint_handler);
1666signal(SIGINT, data_sigterm_sigint_handler);
1667
1668/* Header lines in messages are not supposed to be very long, though when
1669unfolded, to: and cc: headers can take up a lot of store. We must also cope
1670with the possibility of junk being thrown at us. Start by getting 256 bytes for
1671storing the header, and extend this as necessary using string_cat().
1672
1673To cope with total lunacies, impose an upper limit on the length of the header
1674section of the message, as otherwise the store will fill up. We must also cope
1675with the possibility of binary zeros in the data. Hence we cannot use fgets().
1676Folded header lines are joined into one string, leaving the '\n' characters
1677inside them, so that writing them out reproduces the input.
1678
1679Loop for each character of each header; the next structure for chaining the
1680header is set up already, with ptr the offset of the next character in
1681next->text. */
1682
1683for (;;)
1684 {
80a47a2c 1685 int ch = (receive_getc)();
059ec3d9
PH
1686
1687 /* If we hit EOF on a SMTP connection, it's an error, since incoming
1688 SMTP must have a correct "." terminator. */
1689
1690 if (ch == EOF && smtp_input /* && !smtp_batched_input */)
1691 {
1692 smtp_reply = handle_lost_connection(US" (header)");
1693 smtp_yield = FALSE;
1694 goto TIDYUP; /* Skip to end of function */
1695 }
1696
1697 /* See if we are at the current header's size limit - there must be at least
1698 four bytes left. This allows for the new character plus a zero, plus two for
1699 extra insertions when we are playing games with dots and carriage returns. If
1700 we are at the limit, extend the text buffer. This could have been done
1701 automatically using string_cat() but because this is a tightish loop storing
1702 only one character at a time, we choose to do it inline. Normally
1703 store_extend() will be able to extend the block; only at the end of a big
1704 store block will a copy be needed. To handle the case of very long headers
1705 (and sometimes lunatic messages can have ones that are 100s of K long) we
1706 call store_release() for strings that have been copied - if the string is at
1707 the start of a block (and therefore the only thing in it, because we aren't
1708 doing any other gets), the block gets freed. We can only do this because we
1709 know there are no other calls to store_get() going on. */
1710
1711 if (ptr >= header_size - 4)
1712 {
1713 int oldsize = header_size;
1714 /* header_size += 256; */
1715 header_size *= 2;
1716 if (!store_extend(next->text, oldsize, header_size))
1717 {
1718 uschar *newtext = store_get(header_size);
1719 memcpy(newtext, next->text, ptr);
1720 store_release(next->text);
1721 next->text = newtext;
1722 }
1723 }
1724
1725 /* Cope with receiving a binary zero. There is dispute about whether
1726 these should be allowed in RFC 822 messages. The middle view is that they
1727 should not be allowed in headers, at least. Exim takes this attitude at
1728 the moment. We can't just stomp on them here, because we don't know that
1729 this line is a header yet. Set a flag to cause scanning later. */
1730
1731 if (ch == 0) had_zero++;
1732
1733 /* Test for termination. Lines in remote SMTP are terminated by CRLF, while
1734 those from data files use just LF. Treat LF in local SMTP input as a
1735 terminator too. Treat EOF as a line terminator always. */
1736
1737 if (ch == EOF) goto EOL;
1738
1739 /* FUDGE: There are sites out there that don't send CRs before their LFs, and
1740 other MTAs accept this. We are therefore forced into this "liberalisation"
1741 too, so we accept LF as a line terminator whatever the source of the message.
1742 However, if the first line of the message ended with a CRLF, we treat a bare
1743 LF specially by inserting a white space after it to ensure that the header
1744 line is not terminated. */
1745
1746 if (ch == '\n')
1747 {
1748 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE;
80a47a2c 1749 else if (first_line_ended_crlf) receive_ungetc(' ');
059ec3d9
PH
1750 goto EOL;
1751 }
1752
1753 /* This is not the end of the line. If this is SMTP input and this is
1754 the first character in the line and it is a "." character, ignore it.
1755 This implements the dot-doubling rule, though header lines starting with
1756 dots aren't exactly common. They are legal in RFC 822, though. If the
1757 following is CRLF or LF, this is the line that that terminates the
1758 entire message. We set message_ended to indicate this has happened (to
1759 prevent further reading), and break out of the loop, having freed the
1760 empty header, and set next = NULL to indicate no data line. */
1761
1762 if (ptr == 0 && ch == '.' && (smtp_input || dot_ends))
1763 {
80a47a2c 1764 ch = (receive_getc)();
059ec3d9
PH
1765 if (ch == '\r')
1766 {
80a47a2c 1767 ch = (receive_getc)();
059ec3d9
PH
1768 if (ch != '\n')
1769 {
80a47a2c 1770 receive_ungetc(ch);
059ec3d9
PH
1771 ch = '\r'; /* Revert to CR */
1772 }
1773 }
1774 if (ch == '\n')
1775 {
1776 message_ended = END_DOT;
1777 store_reset(next);
1778 next = NULL;
1779 break; /* End character-reading loop */
1780 }
1781
1782 /* For non-SMTP input, the dot at the start of the line was really a data
1783 character. What is now in ch is the following character. We guaranteed
1784 enough space for this above. */
1785
1786 if (!smtp_input)
1787 {
1788 next->text[ptr++] = '.';
1789 message_size++;
1790 }
1791 }
1792
1793 /* If CR is immediately followed by LF, end the line, ignoring the CR, and
1794 remember this case if this is the first line ending. */
1795
1796 if (ch == '\r')
1797 {
80a47a2c 1798 ch = (receive_getc)();
059ec3d9
PH
1799 if (ch == '\n')
1800 {
1801 if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE;
1802 goto EOL;
1803 }
1804
1805 /* Otherwise, put back the character after CR, and turn the bare CR
1806 into LF SP. */
1807
80a47a2c 1808 ch = (receive_ungetc)(ch);
059ec3d9
PH
1809 next->text[ptr++] = '\n';
1810 message_size++;
1811 ch = ' ';
1812 }
1813
1814 /* We have a data character for the header line. */
1815
1816 next->text[ptr++] = ch; /* Add to buffer */
1817 message_size++; /* Total message size so far */
1818
1819 /* Handle failure due to a humungously long header section. The >= allows
1820 for the terminating \n. Add what we have so far onto the headers list so
1821 that it gets reflected in any error message, and back up the just-read
1822 character. */
1823
1824 if (message_size >= header_maxsize)
1825 {
1826 next->text[ptr] = 0;
1827 next->slen = ptr;
1828 next->type = htype_other;
1829 next->next = NULL;
1830 header_last->next = next;
1831 header_last = next;
1832
1833 log_write(0, LOG_MAIN, "ridiculously long message header received from "
1834 "%s (more than %d characters): message abandoned",
1835 sender_host_unknown? sender_ident : sender_fullhost, header_maxsize);
1836
1837 if (smtp_input)
1838 {
1839 smtp_reply = US"552 Message header is ridiculously long";
1840 receive_swallow_smtp();
1841 goto TIDYUP; /* Skip to end of function */
1842 }
1843
1844 else
1845 {
1846 give_local_error(ERRMESS_VLONGHEADER,
1847 string_sprintf("message header longer than %d characters received: "
1848 "message not accepted", header_maxsize), US"", error_rc, stdin,
1849 header_list->next);
1850 /* Does not return */
1851 }
1852 }
1853
1854 continue; /* With next input character */
1855
1856 /* End of header line reached */
1857
1858 EOL:
2e0c1448
PH
1859
1860 /* Keep track of lines for BSMTP errors and overall message_linecount. */
1861
1862 receive_linecount++;
1863 message_linecount++;
059ec3d9 1864
d677b2f2
PH
1865 /* Keep track of maximum line length */
1866
1867 if (ptr - prevlines_length > max_received_linelength)
1868 max_received_linelength = ptr - prevlines_length;
1869 prevlines_length = ptr + 1;
1870
059ec3d9
PH
1871 /* Now put in the terminating newline. There is always space for
1872 at least two more characters. */
1873
1874 next->text[ptr++] = '\n';
1875 message_size++;
1876
1877 /* A blank line signals the end of the headers; release the unwanted
1878 space and set next to NULL to indicate this. */
1879
1880 if (ptr == 1)
1881 {
1882 store_reset(next);
1883 next = NULL;
1884 break;
1885 }
1886
1887 /* There is data in the line; see if the next input character is a
1888 whitespace character. If it is, we have a continuation of this header line.
1889 There is always space for at least one character at this point. */
1890
1891 if (ch != EOF)
1892 {
80a47a2c 1893 int nextch = (receive_getc)();
059ec3d9
PH
1894 if (nextch == ' ' || nextch == '\t')
1895 {
1896 next->text[ptr++] = nextch;
1897 message_size++;
1898 continue; /* Iterate the loop */
1899 }
80a47a2c 1900 else if (nextch != EOF) (receive_ungetc)(nextch); /* For next time */
059ec3d9
PH
1901 else ch = EOF; /* Cause main loop to exit at end */
1902 }
1903
1904 /* We have got to the real line end. Terminate the string and release store
1905 beyond it. If it turns out to be a real header, internal binary zeros will
1906 be squashed later. */
1907
1908 next->text[ptr] = 0;
1909 next->slen = ptr;
1910 store_reset(next->text + ptr + 1);
1911
1912 /* Check the running total size against the overall message size limit. We
1913 don't expect to fail here, but if the overall limit is set less than MESSAGE_
1914 MAXSIZE and a big header is sent, we want to catch it. Just stop reading
1915 headers - the code to read the body will then also hit the buffer. */
1916
1917 if (message_size > thismessage_size_limit) break;
1918
1919 /* A line that is not syntactically correct for a header also marks
1920 the end of the headers. In this case, we leave next containing the
1921 first data line. This might actually be several lines because of the
1922 continuation logic applied above, but that doesn't matter.
1923
1924 It turns out that smail, and presumably sendmail, accept leading lines
1925 of the form
1926
1927 From ph10 Fri Jan 5 12:35 GMT 1996
1928
1929 in messages. The "mail" command on Solaris 2 sends such lines. I cannot
1930 find any documentation of this, but for compatibility it had better be
1931 accepted. Exim restricts it to the case of non-smtp messages, and
1932 treats it as an alternative to the -f command line option. Thus it is
1933 ignored except for trusted users or filter testing. Otherwise it is taken
1934 as the sender address, unless -f was used (sendmail compatibility).
1935
1936 It further turns out that some UUCPs generate the From_line in a different
1937 format, e.g.
1938
1939 From ph10 Fri, 7 Jan 97 14:00:00 GMT
1940
1941 The regex for matching these things is now capable of recognizing both
1942 formats (including 2- and 4-digit years in the latter). In fact, the regex
1943 is now configurable, as is the expansion string to fish out the sender.
1944
1945 Even further on it has been discovered that some broken clients send
1946 these lines in SMTP messages. There is now an option to ignore them from
1947 specified hosts or networks. Sigh. */
1948
1949 if (header_last == header_list &&
1950 (!smtp_input
1951 ||
1952 (sender_host_address != NULL &&
1953 verify_check_host(&ignore_fromline_hosts) == OK)
1954 ||
1955 (sender_host_address == NULL && ignore_fromline_local)
1956 ) &&
1957 regex_match_and_setup(regex_From, next->text, 0, -1))
1958 {
1959 if (!sender_address_forced)
1960 {
1961 uschar *uucp_sender = expand_string(uucp_from_sender);
1962 if (uucp_sender == NULL)
1963 {
1964 log_write(0, LOG_MAIN|LOG_PANIC,
1965 "expansion of \"%s\" failed after matching "
1966 "\"From \" line: %s", uucp_from_sender, expand_string_message);
1967 }
1968 else
1969 {
1970 int start, end, domain;
1971 uschar *errmess;
1972 uschar *newsender = parse_extract_address(uucp_sender, &errmess,
1973 &start, &end, &domain, TRUE);
1974 if (newsender != NULL)
1975 {
1976 if (domain == 0 && newsender[0] != 0)
1977 newsender = rewrite_address_qualify(newsender, FALSE);
1978
f05da2e8 1979 if (filter_test != FTEST_NONE || receive_check_set_sender(newsender))
059ec3d9
PH
1980 {
1981 sender_address = newsender;
1982
f05da2e8 1983 if (trusted_caller || filter_test != FTEST_NONE)
059ec3d9
PH
1984 {
1985 authenticated_sender = NULL;
1986 originator_name = US"";
1987 sender_local = FALSE;
1988 }
1989
f05da2e8 1990 if (filter_test != FTEST_NONE)
059ec3d9
PH
1991 printf("Sender taken from \"From \" line\n");
1992 }
1993 }
1994 }
1995 }
1996 }
1997
1998 /* Not a leading "From " line. Check to see if it is a valid header line.
1999 Header names may contain any non-control characters except space and colon,
2000 amazingly. */
2001
2002 else
2003 {
2004 uschar *p = next->text;
2005
2006 /* If not a valid header line, break from the header reading loop, leaving
2007 next != NULL, indicating that it holds the first line of the body. */
2008
2009 if (isspace(*p)) break;
2010 while (mac_isgraph(*p) && *p != ':') p++;
2011 while (isspace(*p)) p++;
2012 if (*p != ':')
2013 {
2014 body_zerocount = had_zero;
2015 break;
2016 }
2017
2018 /* We have a valid header line. If there were any binary zeroes in
2019 the line, stomp on them here. */
2020
2021 if (had_zero > 0)
2022 for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?';
2023
2024 /* It is perfectly legal to have an empty continuation line
2025 at the end of a header, but it is confusing to humans
2026 looking at such messages, since it looks like a blank line.
2027 Reduce confusion by removing redundant white space at the
2028 end. We know that there is at least one printing character
2029 (the ':' tested for above) so there is no danger of running
2030 off the end. */
2031
2032 p = next->text + ptr - 2;
2033 for (;;)
2034 {
2035 while (*p == ' ' || *p == '\t') p--;
2036 if (*p != '\n') break;
2037 ptr = (p--) - next->text + 1;
2038 message_size -= next->slen - ptr;
2039 next->text[ptr] = 0;
2040 next->slen = ptr;
2041 }
2042
2043 /* Add the header to the chain */
2044
2045 next->type = htype_other;
2046 next->next = NULL;
2047 header_last->next = next;
2048 header_last = next;
2049
2050 /* Check the limit for individual line lengths. This comes after adding to
2051 the chain so that the failing line is reflected if a bounce is generated
2052 (for a local message). */
2053
2054 if (header_line_maxsize > 0 && next->slen > header_line_maxsize)
2055 {
2056 log_write(0, LOG_MAIN, "overlong message header line received from "
2057 "%s (more than %d characters): message abandoned",
2058 sender_host_unknown? sender_ident : sender_fullhost,
2059 header_line_maxsize);
2060
2061 if (smtp_input)
2062 {
2063 smtp_reply = US"552 A message header line is too long";
2064 receive_swallow_smtp();
2065 goto TIDYUP; /* Skip to end of function */
2066 }
2067
2068 else
2069 {
2070 give_local_error(ERRMESS_VLONGHDRLINE,
2071 string_sprintf("message header line longer than %d characters "
2072 "received: message not accepted", header_line_maxsize), US"",
2073 error_rc, stdin, header_list->next);
2074 /* Does not return */
2075 }
2076 }
2077
2078 /* Note if any resent- fields exist. */
2079
2080 if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0)
2081 {
2082 resents_exist = TRUE;
2083 resent_prefix = US"Resent-";
2084 }
2085 }
2086
2087 /* The line has been handled. If we have hit EOF, break out of the loop,
2088 indicating no pending data line. */
2089
2090 if (ch == EOF) { next = NULL; break; }
2091
2092 /* Set up for the next header */
2093
2094 header_size = 256;
2095 next = store_get(sizeof(header_line));
2096 next->text = store_get(header_size);
2097 ptr = 0;
2098 had_zero = 0;
d677b2f2 2099 prevlines_length = 0;
059ec3d9
PH
2100 } /* Continue, starting to read the next header */
2101
2102/* At this point, we have read all the headers into a data structure in main
2103store. The first header is still the dummy placeholder for the Received: header
2104we are going to generate a bit later on. If next != NULL, it contains the first
2105data line - which terminated the headers before reaching a blank line (not the
2106normal case). */
2107
2108DEBUG(D_receive)
2109 {
2110 debug_printf(">>Headers received:\n");
2111 for (h = header_list->next; h != NULL; h = h->next)
2112 debug_printf("%s", h->text);
2113 debug_printf("\n");
2114 }
2115
2116/* End of file on any SMTP connection is an error. If an incoming SMTP call
2117is dropped immediately after valid headers, the next thing we will see is EOF.
2118We must test for this specially, as further down the reading of the data is
2119skipped if already at EOF. */
2120
2121if (smtp_input && (receive_feof)())
2122 {
2123 smtp_reply = handle_lost_connection(US" (after header)");
2124 smtp_yield = FALSE;
2125 goto TIDYUP; /* Skip to end of function */
2126 }
2127
2128/* If this is a filter test run and no headers were read, output a warning
2129in case there is a mistake in the test message. */
2130
f05da2e8 2131if (filter_test != FTEST_NONE && header_list->next == NULL)
059ec3d9
PH
2132 printf("Warning: no message headers read\n");
2133
2134
2135/* Scan the headers to identify them. Some are merely marked for later
2136processing; some are dealt with here. */
2137
2138for (h = header_list->next; h != NULL; h = h->next)
2139 {
2140 BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0;
2141 if (is_resent) contains_resent_headers = TRUE;
2142
2143 switch (header_checkname(h, is_resent))
2144 {
059ec3d9 2145 case htype_bcc:
2cbb4081 2146 h->type = htype_bcc; /* Both Bcc: and Resent-Bcc: */
059ec3d9
PH
2147 break;
2148
059ec3d9 2149 case htype_cc:
2cbb4081 2150 h->type = htype_cc; /* Both Cc: and Resent-Cc: */
059ec3d9
PH
2151 break;
2152
2153 /* Record whether a Date: or Resent-Date: header exists, as appropriate. */
2154
2155 case htype_date:
4c69d561 2156 if (!resents_exist || is_resent) date_header_exists = TRUE;
059ec3d9
PH
2157 break;
2158
2159 /* Same comments as about Return-Path: below. */
2160
2161 case htype_delivery_date:
2162 if (delivery_date_remove) h->type = htype_old;
2163 break;
2164
2165 /* Same comments as about Return-Path: below. */
2166
2167 case htype_envelope_to:
2168 if (envelope_to_remove) h->type = htype_old;
2169 break;
2170
2171 /* Mark all "From:" headers so they get rewritten. Save the one that is to
2172 be used for Sender: checking. For Sendmail compatibility, if the "From:"
2173 header consists of just the login id of the user who called Exim, rewrite
2174 it with the gecos field first. Apply this rule to Resent-From: if there
2175 are resent- fields. */
2176
2177 case htype_from:
2178 h->type = htype_from;
2179 if (!resents_exist || is_resent)
2180 {
2181 from_header = h;
2182 if (!smtp_input)
2183 {
5de8faa3 2184 int len;
059ec3d9
PH
2185 uschar *s = Ustrchr(h->text, ':') + 1;
2186 while (isspace(*s)) s++;
5de8faa3 2187 len = h->slen - (s - h->text) - 1;
e0fccd1d
TF
2188 if (Ustrlen(originator_login) == len &&
2189 strncmpic(s, originator_login, len) == 0)
059ec3d9
PH
2190 {
2191 uschar *name = is_resent? US"Resent-From" : US"From";
2192 header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name,
2193 originator_login, qualify_domain_sender);
2194 from_header = header_last;
2195 h->type = htype_old;
2196 DEBUG(D_receive|D_rewrite)
2197 debug_printf("rewrote \"%s:\" header using gecos\n", name);
2198 }
2199 }
2200 }
2201 break;
2202
2203 /* Identify the Message-id: header for generating "in-reply-to" in the
2204 autoreply transport. For incoming logging, save any resent- value. In both
2205 cases, take just the first of any multiples. */
2206
2207 case htype_id:
2208 if (msgid_header == NULL && (!resents_exist || is_resent))
2209 {
2210 msgid_header = h;
2211 h->type = htype_id;
2212 }
2213 break;
2214
2215 /* Flag all Received: headers */
2216
2217 case htype_received:
2218 h->type = htype_received;
2219 received_count++;
2220 break;
2221
2222 /* "Reply-to:" is just noted (there is no resent-reply-to field) */
2223
2224 case htype_reply_to:
2225 h->type = htype_reply_to;
2226 break;
2227
2228 /* The Return-path: header is supposed to be added to messages when
2229 they leave the SMTP system. We shouldn't receive messages that already
2230 contain Return-path. However, since Exim generates Return-path: on
2231 local delivery, resent messages may well contain it. We therefore
2232 provide an option (which defaults on) to remove any Return-path: headers
2233 on input. Removal actually means flagging as "old", which prevents the
2234 header being transmitted with the message. */
2235
2236 case htype_return_path:
2237 if (return_path_remove) h->type = htype_old;
2238
2239 /* If we are testing a mail filter file, use the value of the
2240 Return-Path: header to set up the return_path variable, which is not
2241 otherwise set. However, remove any <> that surround the address
2242 because the variable doesn't have these. */
2243
f05da2e8 2244 if (filter_test != FTEST_NONE)
059ec3d9
PH
2245 {
2246 uschar *start = h->text + 12;
2247 uschar *end = start + Ustrlen(start);
2248 while (isspace(*start)) start++;
2249 while (end > start && isspace(end[-1])) end--;
2250 if (*start == '<' && end[-1] == '>')
2251 {
2252 start++;
2253 end--;
2254 }
2255 return_path = string_copyn(start, end - start);
2256 printf("Return-path taken from \"Return-path:\" header line\n");
2257 }
2258 break;
2259
2260 /* If there is a "Sender:" header and the message is locally originated,
8800895a
PH
2261 and from an untrusted caller and suppress_local_fixups is not set, or if we
2262 are in submission mode for a remote message, mark it "old" so that it will
2263 not be transmitted with the message, unless active_local_sender_retain is
2264 set. (This can only be true if active_local_from_check is false.) If there
2265 are any resent- headers in the message, apply this rule to Resent-Sender:
2266 instead of Sender:. Messages with multiple resent- header sets cannot be
2267 tidily handled. (For this reason, at least one MUA - Pine - turns old
2268 resent- headers into X-resent- headers when resending, leaving just one
2269 set.) */
059ec3d9
PH
2270
2271 case htype_sender:
69358f02 2272 h->type = ((!active_local_sender_retain &&
8800895a
PH
2273 (
2274 (sender_local && !trusted_caller && !suppress_local_fixups)
2275 || submission_mode
2276 )
059ec3d9
PH
2277 ) &&
2278 (!resents_exist||is_resent))?
2279 htype_old : htype_sender;
2280 break;
2281
2282 /* Remember the Subject: header for logging. There is no Resent-Subject */
2283
2284 case htype_subject:
2285 subject_header = h;
2286 break;
2287
2288 /* "To:" gets flagged, and the existence of a recipient header is noted,
2289 whether it's resent- or not. */
2290
2291 case htype_to:
2292 h->type = htype_to;
2293 /****
2294 to_or_cc_header_exists = TRUE;
2295 ****/
2296 break;
2297 }
2298 }
2299
2300/* Extract recipients from the headers if that is required (the -t option).
2301Note that this is documented as being done *before* any address rewriting takes
2302place. There are two possibilities:
2303
2304(1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any
2305recipients already listed are to be REMOVED from the message. Smail 3 works
2306like this. We need to build a non-recipients tree for that list, because in
2307subsequent processing this data is held in a tree and that's what the
2308spool_write_header() function expects. Make sure that non-recipient addresses
2309are fully qualified and rewritten if necessary.
2310
2311(2) According to other sendmail documentation, -t ADDS extracted recipients to
2312those in the command line arguments (and it is rumoured some other MTAs do
2313this). Therefore, there is an option to make Exim behave this way.
2314
2315*** Notes on "Resent-" header lines ***
2316
2317The presence of resent-headers in the message makes -t horribly ambiguous.
2318Experiments with sendmail showed that it uses recipients for all resent-
2319headers, totally ignoring the concept of "sets of resent- headers" as described
2320in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set
2321with all the addresses in one instance of each header.
2322
2323This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an
2324error for -t if there were resent- headers in the message. However, after a
2325discussion on the mailing list, I've learned that there are MUAs that use
2326resent- headers with -t, and also that the stuff about sets of resent- headers
2327and their ordering in RFC 2822 is generally ignored. An MUA that submits a
2328message with -t and resent- header lines makes sure that only *its* resent-
2329headers are present; previous ones are often renamed as X-resent- for example.
2330
2331Consequently, Exim has been changed so that, if any resent- header lines are
2332present, the recipients are taken from all of the appropriate resent- lines,
2333and not from the ordinary To:, Cc:, etc. */
2334
2335if (extract_recip)
2336 {
2337 int rcount = 0;
2338 error_block **bnext = &bad_addresses;
2339
2340 if (extract_addresses_remove_arguments)
2341 {
2342 while (recipients_count-- > 0)
2343 {
2344 uschar *s = rewrite_address(recipients_list[recipients_count].address,
2345 TRUE, TRUE, global_rewrite_rules, rewrite_existflags);
2346 tree_add_nonrecipient(s);
2347 }
2348 recipients_list = NULL;
2349 recipients_count = recipients_list_max = 0;
2350 }
2351
059ec3d9
PH
2352 /* Now scan the headers */
2353
2354 for (h = header_list->next; h != NULL; h = h->next)
2355 {
2356 if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) &&
2357 (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0))
2358 {
2359 uschar *s = Ustrchr(h->text, ':') + 1;
2360 while (isspace(*s)) s++;
2361
1eccaa59
PH
2362 parse_allow_group = TRUE; /* Allow address group syntax */
2363
059ec3d9
PH
2364 while (*s != 0)
2365 {
2366 uschar *ss = parse_find_address_end(s, FALSE);
2367 uschar *recipient, *errmess, *p, *pp;
2368 int start, end, domain;
2369
2370 /* Check on maximum */
2371
2372 if (recipients_max > 0 && ++rcount > recipients_max)
2373 {
2374 give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients",
2375 US"message rejected: ", error_rc, stdin, NULL);
2376 /* Does not return */
2377 }
2378
2379 /* Make a copy of the address, and remove any internal newlines. These
2380 may be present as a result of continuations of the header line. The
2381 white space that follows the newline must not be removed - it is part
2382 of the header. */
2383
2384 pp = recipient = store_get(ss - s + 1);
2385 for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p;
2386 *pp = 0;
250b6871 2387
8c5d388a 2388#ifdef SUPPORT_I18N
250b6871
JH
2389 {
2390 BOOL b = allow_utf8_domains;
2391 allow_utf8_domains = TRUE;
2392#endif
059ec3d9
PH
2393 recipient = parse_extract_address(recipient, &errmess, &start, &end,
2394 &domain, FALSE);
2395
8c5d388a 2396#ifdef SUPPORT_I18N
250b6871
JH
2397 if (string_is_utf8(recipient))
2398 message_smtputf8 = TRUE;
2399 else
2400 allow_utf8_domains = b;
2401 }
2402#endif
2403
059ec3d9
PH
2404 /* Keep a list of all the bad addresses so we can send a single
2405 error message at the end. However, an empty address is not an error;
2406 just ignore it. This can come from an empty group list like
2407
2408 To: Recipients of list:;
2409
2410 If there are no recipients at all, an error will occur later. */
2411
2412 if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2413 {
2414 int len = Ustrlen(s);
2415 error_block *b = store_get(sizeof(error_block));
2416 while (len > 0 && isspace(s[len-1])) len--;
2417 b->next = NULL;
2418 b->text1 = string_printing(string_copyn(s, len));
2419 b->text2 = errmess;
2420 *bnext = b;
2421 bnext = &(b->next);
2422 }
2423
2424 /* If the recipient is already in the nonrecipients tree, it must
2425 have appeared on the command line with the option extract_addresses_
2426 remove_arguments set. Do not add it to the recipients, and keep a note
2427 that this has happened, in order to give a better error if there are
2428 no recipients left. */
2429
2430 else if (recipient != NULL)
2431 {
2432 if (tree_search(tree_nonrecipients, recipient) == NULL)
2433 receive_add_recipient(recipient, -1);
2434 else
2435 extracted_ignored = TRUE;
2436 }
2437
2438 /* Move on past this address */
2439
2440 s = ss + (*ss? 1:0);
2441 while (isspace(*s)) s++;
1eccaa59
PH
2442 } /* Next address */
2443
2444 parse_allow_group = FALSE; /* Reset group syntax flags */
2445 parse_found_group = FALSE;
059ec3d9
PH
2446
2447 /* If this was the bcc: header, mark it "old", which means it
2448 will be kept on the spool, but not transmitted as part of the
2449 message. */
2450
2cbb4081 2451 if (h->type == htype_bcc) h->type = htype_old;
059ec3d9
PH
2452 } /* For appropriate header line */
2453 } /* For each header line */
2454
059ec3d9
PH
2455 }
2456
2457/* Now build the unique message id. This has changed several times over the
2458lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003).
2459Retaining all the history in the comment has become too unwieldy - read
2460previous release sources if you want it.
2461
2462The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62.
2463The first part is the current time, in seconds. The second part is the current
2464pid. Both are large enough to hold 32-bit numbers in base 62. The third part
2465can hold a number in the range 0-3843. It used to be a computed sequence
2466number, but is now the fractional component of the current time in units of
24671/2000 of a second (i.e. a value in the range 0-1999). After a message has been
2468received, Exim ensures that the timer has ticked at the appropriate level
2469before proceeding, to avoid duplication if the pid happened to be re-used
2470within the same time period. It seems likely that most messages will take at
2471least half a millisecond to be received, so no delay will normally be
2472necessary. At least for some time...
2473
2474There is a modification when localhost_number is set. Formerly this was allowed
2475to be as large as 255. Now it is restricted to the range 0-16, and the final
2476component of the message id becomes (localhost_number * 200) + fractional time
2477in units of 1/200 of a second (i.e. a value in the range 0-3399).
2478
2479Some not-really-Unix operating systems use case-insensitive file names (Darwin,
2480Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this
2481still allows the tttttt field to hold a large enough number to last for some
2482more decades, and the final two-digit field can hold numbers up to 1295, which
2483is enough for milliseconds (instead of 1/2000 of a second).
2484
2485However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit
2486pid, so it is probably safe because pids have to be positive. The
2487localhost_number is restricted to 0-10 for these hosts, and when it is set, the
2488final field becomes (localhost_number * 100) + fractional time in centiseconds.
2489
2490Note that string_base62() returns its data in a static storage block, so it
2491must be copied before calling string_base62() again. It always returns exactly
24926 characters.
2493
2494There doesn't seem to be anything in the RFC which requires a message id to
2495start with a letter, but Smail was changed to ensure this. The external form of
2496the message id (as supplied by string expansion) therefore starts with an
2497additional leading 'E'. The spool file names do not include this leading
2498letter and it is not used internally.
2499
2500NOTE: If ever the format of message ids is changed, the regular expression for
2501checking that a string is in this format must be updated in a corresponding
2502way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH
2503must also be changed to reflect the correct string length. Then, of course,
2504other programs that rely on the message id format will need updating too. */
2505
2506Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6);
2507message_id[6] = '-';
2508Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6);
2509
2510/* Deal with the case where the host number is set. The value of the number was
2511checked when it was read, to ensure it isn't too big. The timing granularity is
2512left in id_resolution so that an appropriate wait can be done after receiving
2513the message, if necessary (we hope it won't be). */
2514
2515if (host_number_string != NULL)
2516 {
2517 id_resolution = (BASE_62 == 62)? 5000 : 10000;
2518 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2519 string_base62((long int)(
2520 host_number * (1000000/id_resolution) +
2521 message_id_tv.tv_usec/id_resolution)) + 4);
2522 }
2523
2524/* Host number not set: final field is just the fractional time at an
2525appropriate resolution. */
2526
2527else
2528 {
2529 id_resolution = (BASE_62 == 62)? 500 : 1000;
2530 sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s",
2531 string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4);
2532 }
2533
2534/* Add the current message id onto the current process info string if
2535it will fit. */
2536
2537(void)string_format(process_info + process_info_len,
2538 PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id);
2539
2540/* If we are using multiple input directories, set up the one for this message
2541to be the least significant base-62 digit of the time of arrival. Otherwise
2542ensure that it is an empty string. */
2543
a2da3176 2544message_subdir[0] = split_spool_directory ? message_id[5] : 0;
059ec3d9
PH
2545
2546/* Now that we have the message-id, if there is no message-id: header, generate
8800895a
PH
2547one, but only for local (without suppress_local_fixups) or submission mode
2548messages. This can be user-configured if required, but we had better flatten
2549any illegal characters therein. */
059ec3d9 2550
8800895a
PH
2551if (msgid_header == NULL &&
2552 ((sender_host_address == NULL && !suppress_local_fixups)
2553 || submission_mode))
059ec3d9
PH
2554 {
2555 uschar *p;
2556 uschar *id_text = US"";
2557 uschar *id_domain = primary_hostname;
2558
2559 /* Permit only letters, digits, dots, and hyphens in the domain */
2560
2561 if (message_id_domain != NULL)
2562 {
2563 uschar *new_id_domain = expand_string(message_id_domain);
2564 if (new_id_domain == NULL)
2565 {
2566 if (!expand_string_forcedfail)
2567 log_write(0, LOG_MAIN|LOG_PANIC,
2568 "expansion of \"%s\" (message_id_header_domain) "
2569 "failed: %s", message_id_domain, expand_string_message);
2570 }
2571 else if (*new_id_domain != 0)
2572 {
2573 id_domain = new_id_domain;
2574 for (p = id_domain; *p != 0; p++)
2575 if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */
2576 }
2577 }
2578
2579 /* Permit all characters except controls and RFC 2822 specials in the
2580 additional text part. */
2581
2582 if (message_id_text != NULL)
2583 {
2584 uschar *new_id_text = expand_string(message_id_text);
2585 if (new_id_text == NULL)
2586 {
2587 if (!expand_string_forcedfail)
2588 log_write(0, LOG_MAIN|LOG_PANIC,
2589 "expansion of \"%s\" (message_id_header_text) "
2590 "failed: %s", message_id_text, expand_string_message);
2591 }
2592 else if (*new_id_text != 0)
2593 {
2594 id_text = new_id_text;
2595 for (p = id_text; *p != 0; p++)
2596 if (mac_iscntrl_or_special(*p)) *p = '-';
2597 }
2598 }
2599
e7e680d6
PP
2600 /* Add the header line
2601 * Resent-* headers are prepended, per RFC 5322 3.6.6. Non-Resent-* are
2602 * appended, to preserve classical expectations of header ordering. */
059ec3d9 2603
e7e680d6 2604 header_add_at_position(!resents_exist, NULL, FALSE, htype_id,
5eb690a1
NM
2605 "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, message_id_external,
2606 (*id_text == 0)? "" : ".", id_text, id_domain);
059ec3d9
PH
2607 }
2608
2609/* If we are to log recipients, keep a copy of the raw ones before any possible
2610rewriting. Must copy the count, because later ACLs and the local_scan()
2611function may mess with the real recipients. */
2612
6c6d6e48 2613if (LOGGING(received_recipients))
059ec3d9
PH
2614 {
2615 raw_recipients = store_get(recipients_count * sizeof(uschar *));
2616 for (i = 0; i < recipients_count; i++)
2617 raw_recipients[i] = string_copy(recipients_list[i].address);
2618 raw_recipients_count = recipients_count;
2619 }
2620
2621/* Ensure the recipients list is fully qualified and rewritten. Unqualified
2622recipients will get here only if the conditions were right (allow_unqualified_
2623recipient is TRUE). */
2624
2625for (i = 0; i < recipients_count; i++)
2626 recipients_list[i].address =
2627 rewrite_address(recipients_list[i].address, TRUE, TRUE,
2628 global_rewrite_rules, rewrite_existflags);
2629
8800895a
PH
2630/* If there is no From: header, generate one for local (without
2631suppress_local_fixups) or submission_mode messages. If there is no sender
2632address, but the sender is local or this is a local delivery error, use the
2633originator login. This shouldn't happen for genuine bounces, but might happen
2634for autoreplies. The addition of From: must be done *before* checking for the
2635possible addition of a Sender: header, because untrusted_set_sender allows an
2636untrusted user to set anything in the envelope (which might then get info
2637From:) but we still want to ensure a valid Sender: if it is required. */
2638
2639if (from_header == NULL &&
2640 ((sender_host_address == NULL && !suppress_local_fixups)
2641 || submission_mode))
059ec3d9 2642 {
2fe1a124
PH
2643 uschar *oname = US"";
2644
2645 /* Use the originator_name if this is a locally submitted message and the
2646 caller is not trusted. For trusted callers, use it only if -F was used to
2647 force its value or if we have a non-SMTP message for which -f was not used
2648 to set the sender. */
2649
2650 if (sender_host_address == NULL)
2651 {
2652 if (!trusted_caller || sender_name_forced ||
2653 (!smtp_input && !sender_address_forced))
2654 oname = originator_name;
2655 }
2656
2657 /* For non-locally submitted messages, the only time we use the originator
2658 name is when it was forced by the /name= option on control=submission. */
2659
2660 else
2661 {
2662 if (submission_name != NULL) oname = submission_name;
2663 }
2664
059ec3d9
PH
2665 /* Envelope sender is empty */
2666
2667 if (sender_address[0] == 0)
2668 {
87ba3f5f
PH
2669 uschar *fromstart, *fromend;
2670
2671 fromstart = string_sprintf("%sFrom: %s%s", resent_prefix,
2fe1a124
PH
2672 oname, (oname[0] == 0)? "" : " <");
2673 fromend = (oname[0] == 0)? US"" : US">";
87ba3f5f 2674
059ec3d9
PH
2675 if (sender_local || local_error_message)
2676 {
87ba3f5f
PH
2677 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2678 local_part_quote(originator_login), qualify_domain_sender,
2679 fromend);
059ec3d9
PH
2680 }
2681 else if (submission_mode && authenticated_id != NULL)
2682 {
2683 if (submission_domain == NULL)
2684 {
87ba3f5f
PH
2685 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2686 local_part_quote(authenticated_id), qualify_domain_sender,
2687 fromend);
059ec3d9
PH
2688 }
2689 else if (submission_domain[0] == 0) /* empty => whole address set */
2690 {
87ba3f5f
PH
2691 header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id,
2692 fromend);
059ec3d9
PH
2693 }
2694 else
2695 {
87ba3f5f
PH
2696 header_add(htype_from, "%s%s@%s%s\n", fromstart,
2697 local_part_quote(authenticated_id), submission_domain,
2698 fromend);
059ec3d9
PH
2699 }
2700 from_header = header_last; /* To get it checked for Sender: */
2701 }
2702 }
2703
2704 /* There is a non-null envelope sender. Build the header using the original
2705 sender address, before any rewriting that might have been done while
2706 verifying it. */
2707
2708 else
2709 {
87ba3f5f 2710 header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix,
2fe1a124
PH
2711 oname,
2712 (oname[0] == 0)? "" : " <",
87ba3f5f
PH
2713 (sender_address_unrewritten == NULL)?
2714 sender_address : sender_address_unrewritten,
2fe1a124 2715 (oname[0] == 0)? "" : ">");
059ec3d9
PH
2716
2717 from_header = header_last; /* To get it checked for Sender: */
2718 }
2719 }
2720
2721
8800895a
PH
2722/* If the sender is local (without suppress_local_fixups), or if we are in
2723submission mode and there is an authenticated_id, check that an existing From:
2724is correct, and if not, generate a Sender: header, unless disabled. Any
2725previously-existing Sender: header was removed above. Note that sender_local,
2726as well as being TRUE if the caller of exim is not trusted, is also true if a
2727trusted caller did not supply a -f argument for non-smtp input. To allow
2728trusted callers to forge From: without supplying -f, we have to test explicitly
2729here. If the From: header contains more than one address, then the call to
2730parse_extract_address fails, and a Sender: header is inserted, as required. */
059ec3d9
PH
2731
2732if (from_header != NULL &&
69358f02 2733 (active_local_from_check &&
8800895a 2734 ((sender_local && !trusted_caller && !suppress_local_fixups) ||
69358f02 2735 (submission_mode && authenticated_id != NULL))
059ec3d9
PH
2736 ))
2737 {
2738 BOOL make_sender = TRUE;
2739 int start, end, domain;
2740 uschar *errmess;
2741 uschar *from_address =
2742 parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess,
2743 &start, &end, &domain, FALSE);
2744 uschar *generated_sender_address;
2745
2746 if (submission_mode)
2747 {
2748 if (submission_domain == NULL)
2749 {
2750 generated_sender_address = string_sprintf("%s@%s",
2751 local_part_quote(authenticated_id), qualify_domain_sender);
2752 }
2753 else if (submission_domain[0] == 0) /* empty => full address */
2754 {
2755 generated_sender_address = string_sprintf("%s",
2756 authenticated_id);
2757 }
2758 else
2759 {
2760 generated_sender_address = string_sprintf("%s@%s",
2761 local_part_quote(authenticated_id), submission_domain);
2762 }
2763 }
2764 else
2765 generated_sender_address = string_sprintf("%s@%s",
2766 local_part_quote(originator_login), qualify_domain_sender);
2767
2768 /* Remove permitted prefixes and suffixes from the local part of the From:
2769 address before doing the comparison with the generated sender. */
2770
2771 if (from_address != NULL)
2772 {
2773 int slen;
2774 uschar *at = (domain == 0)? NULL : from_address + domain - 1;
2775
2776 if (at != NULL) *at = 0;
2777 from_address += route_check_prefix(from_address, local_from_prefix);
2778 slen = route_check_suffix(from_address, local_from_suffix);
2779 if (slen > 0)
2780 {
2781 memmove(from_address+slen, from_address, Ustrlen(from_address)-slen);
2782 from_address += slen;
2783 }
2784 if (at != NULL) *at = '@';
2785
2786 if (strcmpic(generated_sender_address, from_address) == 0 ||
2787 (domain == 0 && strcmpic(from_address, originator_login) == 0))
2788 make_sender = FALSE;
2789 }
2790
2791 /* We have to cause the Sender header to be rewritten if there are
2792 appropriate rewriting rules. */
2793
2794 if (make_sender)
2795 {
2fe1a124 2796 if (submission_mode && submission_name == NULL)
059ec3d9
PH
2797 header_add(htype_sender, "%sSender: %s\n", resent_prefix,
2798 generated_sender_address);
2799 else
2800 header_add(htype_sender, "%sSender: %s <%s>\n",
2fe1a124
PH
2801 resent_prefix,
2802 submission_mode? submission_name : originator_name,
2803 generated_sender_address);
059ec3d9 2804 }
87ba3f5f
PH
2805
2806 /* Ensure that a non-null envelope sender address corresponds to the
2807 submission mode sender address. */
2808
2809 if (submission_mode && sender_address[0] != 0)
2810 {
2811 if (sender_address_unrewritten == NULL)
2812 sender_address_unrewritten = sender_address;
2813 sender_address = generated_sender_address;
089793a4
TF
2814 if (Ustrcmp(sender_address_unrewritten, generated_sender_address) != 0)
2815 log_write(L_address_rewrite, LOG_MAIN,
2816 "\"%s\" from env-from rewritten as \"%s\" by submission mode",
2817 sender_address_unrewritten, generated_sender_address);
87ba3f5f 2818 }
059ec3d9
PH
2819 }
2820
059ec3d9
PH
2821/* If there are any rewriting rules, apply them to the sender address, unless
2822it has already been rewritten as part of verification for SMTP input. */
2823
2824if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL &&
2825 sender_address[0] != 0)
2826 {
2827 sender_address = rewrite_address(sender_address, FALSE, TRUE,
2828 global_rewrite_rules, rewrite_existflags);
2829 DEBUG(D_receive|D_rewrite)
2830 debug_printf("rewritten sender = %s\n", sender_address);
2831 }
2832
2833
2834/* The headers must be run through rewrite_header(), because it ensures that
2835addresses are fully qualified, as well as applying any rewriting rules that may
2836exist.
2837
2838Qualification of header addresses in a message from a remote host happens only
2839if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as
2840appropriate. For local messages, qualification always happens, unless -bnq is
2841used to explicitly suppress it. No rewriting is done for an unqualified address
2842that is left untouched.
2843
2844We start at the second header, skipping our own Received:. This rewriting is
2845documented as happening *after* recipient addresses are taken from the headers
2846by the -t command line option. An added Sender: gets rewritten here. */
2847
2848for (h = header_list->next; h != NULL; h = h->next)
2849 {
2850 header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules,
2851 rewrite_existflags, TRUE);
2852 if (newh != NULL) h = newh;
2853 }
2854
2855
2856/* An RFC 822 (sic) message is not legal unless it has at least one of "to",
2cbb4081 2857"cc", or "bcc". Note that although the minimal examples in RFC 822 show just
059ec3d9
PH
2858"to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header
2859exists, this applies to the set of resent- headers rather than the normal set.
2860
2cbb4081
PH
2861The requirement for a recipient header has been removed in RFC 2822. At this
2862point in the code, earlier versions of Exim added a To: header for locally
2863submitted messages, and an empty Bcc: header for others. In the light of the
2864changes in RFC 2822, this was dropped in November 2003. */
059ec3d9 2865
059ec3d9
PH
2866
2867/* If there is no date header, generate one if the message originates locally
8800895a
PH
2868(i.e. not over TCP/IP) and suppress_local_fixups is not set, or if the
2869submission mode flag is set. Messages without Date: are not valid, but it seems
e7e680d6
PP
2870to be more confusing if Exim adds one to all remotely-originated messages.
2871As per Message-Id, we prepend if resending, else append.
2872*/
059ec3d9 2873
8800895a
PH
2874if (!date_header_exists &&
2875 ((sender_host_address == NULL && !suppress_local_fixups)
2876 || submission_mode))
e7e680d6
PP
2877 header_add_at_position(!resents_exist, NULL, FALSE, htype_other,
2878 "%sDate: %s\n", resent_prefix, tod_stamp(tod_full));
059ec3d9
PH
2879
2880search_tidyup(); /* Free any cached resources */
2881
2882/* Show the complete set of headers if debugging. Note that the first one (the
2883new Received:) has not yet been set. */
2884
2885DEBUG(D_receive)
2886 {
2887 debug_printf(">>Headers after rewriting and local additions:\n");
2888 for (h = header_list->next; h != NULL; h = h->next)
2889 debug_printf("%c %s", h->type, h->text);
2890 debug_printf("\n");
2891 }
2892
2893/* The headers are now complete in store. If we are running in filter
2894testing mode, that is all this function does. Return TRUE if the message
2895ended with a dot. */
2896
f05da2e8 2897if (filter_test != FTEST_NONE)
059ec3d9
PH
2898 {
2899 process_info[process_info_len] = 0;
2900 return message_ended == END_DOT;
2901 }
2902
7e3ce68e
JH
2903/*XXX CHUNKING: need to cancel cutthrough under BDAT, for now. In future,
2904think more if it could be handled. Cannot do onward CHUNKING unless
2905inbound is, but inbound chunking ought to be ok with outbound plain.
2906Could we do onward CHUNKING given inbound CHUNKING?
2907*/
2908if (chunking_state > CHUNKING_OFFERED)
2909 cancel_cutthrough_connection("chunking active");
2910
817d9f57 2911/* Cutthrough delivery:
5032d1cf
JH
2912We have to create the Received header now rather than at the end of reception,
2913so the timestamp behaviour is a change to the normal case.
2914XXX Ensure this gets documented XXX.
2915Having created it, send the headers to the destination. */
2916if (cutthrough.fd >= 0)
e4bdf652 2917 {
817d9f57
JH
2918 if (received_count > received_headers_max)
2919 {
2e5b33cd 2920 cancel_cutthrough_connection("too many headers");
817d9f57
JH
2921 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
2922 log_write(0, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
2923 "Too many \"Received\" headers",
2924 sender_address,
2925 (sender_fullhost == NULL)? "" : " H=",
2926 (sender_fullhost == NULL)? US"" : sender_fullhost,
2927 (sender_ident == NULL)? "" : " U=",
2928 (sender_ident == NULL)? US"" : sender_ident);
2929 message_id[0] = 0; /* Indicate no message accepted */
2930 smtp_reply = US"550 Too many \"Received\" headers - suspected mail loop";
2931 goto TIDYUP; /* Skip to end of function */
2932 }
e4bdf652 2933 received_header_gen();
578d43dc 2934 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652
JH
2935 (void) cutthrough_headers_send();
2936 }
61147df4 2937
e4bdf652 2938
059ec3d9
PH
2939/* Open a new spool file for the data portion of the message. We need
2940to access it both via a file descriptor and a stream. Try to make the
41313d92 2941directory if it isn't there. */
059ec3d9 2942
41313d92 2943spool_name = spool_fname(US"input", message_subdir, message_id, US"-D");
a2da3176
JH
2944DEBUG(D_receive) debug_printf("Data file name: %s\n", spool_name);
2945
2946if ((data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE)) < 0)
059ec3d9
PH
2947 {
2948 if (errno == ENOENT)
2949 {
0971ec06 2950 (void) directory_make(spool_directory,
41313d92
JH
2951 spool_sname(US"input", message_subdir),
2952 INPUT_DIRECTORY_MODE, TRUE);
059ec3d9
PH
2953 data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE);
2954 }
2955 if (data_fd < 0)
2956 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s",
2957 spool_name, strerror(errno));
2958 }
2959
2960/* Make sure the file's group is the Exim gid, and double-check the mode
2961because the group setting doesn't always get set automatically. */
2962
1ac6b2e7
JH
2963if (fchown(data_fd, exim_uid, exim_gid))
2964 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2965 "Failed setting ownership on spool file %s: %s",
2966 spool_name, strerror(errno));
ff790e47 2967(void)fchmod(data_fd, SPOOL_MODE);
059ec3d9
PH
2968
2969/* We now have data file open. Build a stream for it and lock it. We lock only
2970the first line of the file (containing the message ID) because otherwise there
2971are problems when Exim is run under Cygwin (I'm told). See comments in
2972spool_in.c, where the same locking is done. */
2973
2974data_file = fdopen(data_fd, "w+");
2975lock_data.l_type = F_WRLCK;
2976lock_data.l_whence = SEEK_SET;
2977lock_data.l_start = 0;
2978lock_data.l_len = SPOOL_DATA_START_OFFSET;
2979
2980if (fcntl(data_fd, F_SETLK, &lock_data) < 0)
2981 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name,
2982 errno, strerror(errno));
2983
2984/* We have an open, locked data file. Write the message id to it to make it
2985self-identifying. Then read the remainder of the input of this message and
2986write it to the data file. If the variable next != NULL, it contains the first
2987data line (which was read as a header but then turned out not to have the right
2988format); write it (remembering that it might contain binary zeros). The result
2989of fwrite() isn't inspected; instead we call ferror() below. */
2990
2991fprintf(data_file, "%s-D\n", message_id);
2992if (next != NULL)
2993 {
2994 uschar *s = next->text;
2995 int len = next->slen;
1ac6b2e7 2996 len = fwrite(s, 1, len, data_file); len = len; /* compiler quietening */
059ec3d9
PH
2997 body_linecount++; /* Assumes only 1 line */
2998 }
2999
3000/* Note that we might already be at end of file, or the logical end of file
3001(indicated by '.'), or might have encountered an error while writing the
3002message id or "next" line. */
3003
3004if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT)
3005 {
3006 if (smtp_input)
3007 {
7e3ce68e
JH
3008 message_ended = chunking_state > CHUNKING_OFFERED
3009 ? read_message_bdat_smtp(data_file)
3010 : read_message_data_smtp(data_file);
059ec3d9
PH
3011 receive_linecount++; /* The terminating "." line */
3012 }
3013 else message_ended = read_message_data(data_file);
3014
3015 receive_linecount += body_linecount; /* For BSMTP errors mainly */
2e0c1448 3016 message_linecount += body_linecount;
059ec3d9 3017
7e3ce68e 3018 switch (message_ended)
059ec3d9 3019 {
7e3ce68e 3020 /* Handle premature termination of SMTP */
059ec3d9 3021
7e3ce68e
JH
3022 case END_EOF:
3023 if (smtp_input)
3024 {
3025 Uunlink(spool_name); /* Lose data file when closed */
3026 cancel_cutthrough_connection("sender closed connection");
3027 message_id[0] = 0; /* Indicate no message accepted */
3028 smtp_reply = handle_lost_connection(US"");
3029 smtp_yield = FALSE;
3030 goto TIDYUP; /* Skip to end of function */
3031 }
3032 break;
059ec3d9 3033
7e3ce68e
JH
3034 /* Handle message that is too big. Don't use host_or_ident() in the log
3035 message; we want to see the ident value even for non-remote messages. */
059ec3d9 3036
7e3ce68e
JH
3037 case END_SIZE:
3038 Uunlink(spool_name); /* Lose the data file when closed */
3039 cancel_cutthrough_connection("mail too big");
3040 if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */
059ec3d9 3041
7e3ce68e
JH
3042 log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: "
3043 "message too big: read=%d max=%d",
3044 sender_address,
3045 (sender_fullhost == NULL)? "" : " H=",
3046 (sender_fullhost == NULL)? US"" : sender_fullhost,
3047 (sender_ident == NULL)? "" : " U=",
3048 (sender_ident == NULL)? US"" : sender_ident,
3049 message_size,
3050 thismessage_size_limit);
3051
3052 if (smtp_input)
3053 {
3054 smtp_reply = US"552 Message size exceeds maximum permitted";
3055 message_id[0] = 0; /* Indicate no message accepted */
3056 goto TIDYUP; /* Skip to end of function */
3057 }
3058 else
3059 {
3060 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3061 give_local_error(ERRMESS_TOOBIG,
3062 string_sprintf("message too big (max=%d)", thismessage_size_limit),
3063 US"message rejected: ", error_rc, data_file, header_list);
3064 /* Does not return */
3065 }
3066 break;
3067
3068 /* Handle bad BDAT protocol sequence */
3069
3070 case END_PROTOCOL:
3071 Uunlink(spool_name); /* Lose the data file when closed */
3072 cancel_cutthrough_connection("sender protocol error");
3073 smtp_reply = US""; /* Response already sent */
3074 message_id[0] = 0; /* Indicate no message accepted */
3075 goto TIDYUP; /* Skip to end of function */
059ec3d9
PH
3076 }
3077 }
3078
3079/* Restore the standard SIGALRM handler for any subsequent processing. (For
3080example, there may be some expansion in an ACL that uses a timer.) */
3081
3082os_non_restarting_signal(SIGALRM, sigalrm_handler);
3083
3084/* The message body has now been read into the data file. Call fflush() to
3085empty the buffers in C, and then call fsync() to get the data written out onto
3086the disk, as fflush() doesn't do this (or at least, it isn't documented as
3087having to do this). If there was an I/O error on either input or output,
3088attempt to send an error message, and unlink the spool file. For non-SMTP input
3089we can then give up. Note that for SMTP input we must swallow the remainder of
3090the input in cases of output errors, since the far end doesn't expect to see
3091anything until the terminating dot line is sent. */
3092
3093if (fflush(data_file) == EOF || ferror(data_file) ||
54fc8428 3094 EXIMfsync(fileno(data_file)) < 0 || (receive_ferror)())
059ec3d9
PH
3095 {
3096 uschar *msg_errno = US strerror(errno);
3097 BOOL input_error = (receive_ferror)() != 0;
3098 uschar *msg = string_sprintf("%s error (%s) while receiving message from %s",
3099 input_error? "Input read" : "Spool write",
3100 msg_errno,
3101 (sender_fullhost != NULL)? sender_fullhost : sender_ident);
3102
3103 log_write(0, LOG_MAIN, "Message abandoned: %s", msg);
3104 Uunlink(spool_name); /* Lose the data file */
2e5b33cd 3105 cancel_cutthrough_connection("error writing spoolfile");
059ec3d9
PH
3106
3107 if (smtp_input)
3108 {
3109 if (input_error)
3110 smtp_reply = US"451 Error while reading input data";
3111 else
3112 {
3113 smtp_reply = US"451 Error while writing spool file";
3114 receive_swallow_smtp();
3115 }
3116 message_id[0] = 0; /* Indicate no message accepted */
3117 goto TIDYUP; /* Skip to end of function */
3118 }
3119
3120 else
3121 {
3122 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3123 give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file,
3124 header_list);
3125 /* Does not return */
3126 }
3127 }
3128
3129
3130/* No I/O errors were encountered while writing the data file. */
3131
3132DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id);
3133
3134
3135/* If there were any bad addresses extracted by -t, or there were no recipients
3136left after -t, send a message to the sender of this message, or write it to
3137stderr if the error handling option is set that way. Note that there may
3138legitimately be no recipients for an SMTP message if they have all been removed
3139by "discard".
3140
3141We need to rewind the data file in order to read it. In the case of no
3142recipients or stderr error writing, throw the data file away afterwards, and
3143exit. (This can't be SMTP, which always ensures there's at least one
3144syntactically good recipient address.) */
3145
3146if (extract_recip && (bad_addresses != NULL || recipients_count == 0))
3147 {
3148 DEBUG(D_receive)
3149 {
3150 if (recipients_count == 0) debug_printf("*** No recipients\n");
3151 if (bad_addresses != NULL)
3152 {
3153 error_block *eblock = bad_addresses;
3154 debug_printf("*** Bad address(es)\n");
3155 while (eblock != NULL)
3156 {
3157 debug_printf(" %s: %s\n", eblock->text1, eblock->text2);
3158 eblock = eblock->next;
3159 }
3160 }
3161 }
3162
3163 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3164
3165 /* If configured to send errors to the sender, but this fails, force
3166 a failure error code. We use a special one for no recipients so that it
3167 can be detected by the autoreply transport. Otherwise error_rc is set to
3168 errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case
3169 it is EXIT_SUCCESS. */
3170
3171 if (error_handling == ERRORS_SENDER)
3172 {
3173 if (!moan_to_sender(
3174 (bad_addresses == NULL)?
3175 (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) :
3176 (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS,
3177 bad_addresses, header_list, data_file, FALSE))
3178 error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE;
3179 }
3180 else
3181 {
3182 if (bad_addresses == NULL)
3183 {
3184 if (extracted_ignored)
3185 fprintf(stderr, "exim: all -t recipients overridden by command line\n");
3186 else
3187 fprintf(stderr, "exim: no recipients in message\n");
3188 }
3189 else
3190 {
3191 fprintf(stderr, "exim: invalid address%s",
3192 (bad_addresses->next == NULL)? ":" : "es:\n");
3193 while (bad_addresses != NULL)
3194 {
3195 fprintf(stderr, " %s: %s\n", bad_addresses->text1,
3196 bad_addresses->text2);
3197 bad_addresses = bad_addresses->next;
3198 }
3199 }
3200 }
3201
3202 if (recipients_count == 0 || error_handling == ERRORS_STDERR)
3203 {
3204 Uunlink(spool_name);
f1e894f3 3205 (void)fclose(data_file);
059ec3d9
PH
3206 exim_exit(error_rc);
3207 }
3208 }
3209
3210/* Data file successfully written. Generate text for the Received: header by
3211expanding the configured string, and adding a timestamp. By leaving this
3212operation till now, we ensure that the timestamp is the time that message
3213reception was completed. However, this is deliberately done before calling the
3214data ACL and local_scan().
3215
3216This Received: header may therefore be inspected by the data ACL and by code in
3217the local_scan() function. When they have run, we update the timestamp to be
3218the final time of reception.
3219
3220If there is just one recipient, set up its value in the $received_for variable
3221for use when we generate the Received: header.
3222
3223Note: the checking for too many Received: headers is handled by the delivery
3224code. */
e4bdf652 3225/*XXX eventually add excess Received: check for cutthrough case back when classifying them */
059ec3d9 3226
e4bdf652 3227if (received_header->text == NULL) /* Non-cutthrough case */
059ec3d9 3228 {
e4bdf652 3229 received_header_gen();
059ec3d9 3230
e4bdf652 3231 /* Set the value of message_body_size for the DATA ACL and for local_scan() */
059ec3d9 3232
e4bdf652
JH
3233 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3234 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9 3235
e4bdf652
JH
3236 /* If an ACL from any RCPT commands set up any warning headers to add, do so
3237 now, before running the DATA ACL. */
059ec3d9 3238
578d43dc 3239 add_acl_headers(ACL_WHERE_RCPT, US"MAIL or RCPT");
e4bdf652 3240 }
817d9f57 3241else
e4bdf652
JH
3242 message_body_size = (fstat(data_fd, &statbuf) == 0)?
3243 statbuf.st_size - SPOOL_DATA_START_OFFSET : -1;
059ec3d9
PH
3244
3245/* If an ACL is specified for checking things at this stage of reception of a
3246message, run it, unless all the recipients were removed by "discard" in earlier
3247ACLs. That is the only case in which recipients_count can be zero at this
3248stage. Set deliver_datafile to point to the data file so that $message_body and
3249$message_body_end can be extracted if needed. Allow $recipients in expansions.
3250*/
3251
3252deliver_datafile = data_fd;
4e88a19f 3253user_msg = NULL;
059ec3d9 3254
0e20aff9
MH
3255enable_dollar_recipients = TRUE;
3256
059ec3d9 3257if (recipients_count == 0)
7e3ce68e
JH
3258 blackholed_by = recipients_discarded ? US"MAIL ACL" : US"RCPT ACL";
3259
059ec3d9
PH
3260else
3261 {
059ec3d9
PH
3262 /* Handle interactive SMTP messages */
3263
3264 if (smtp_input && !smtp_batched_input)
3265 {
8523533c 3266
80a47a2c
TK
3267#ifndef DISABLE_DKIM
3268 if (!dkim_disable_verify)
3269 {
3270 /* Finish verification, this will log individual signature results to
3271 the mainlog */
3272 dkim_exim_verify_finish();
3273
3274 /* Check if we must run the DKIM ACL */
7e3ce68e 3275 if (acl_smtp_dkim && dkim_verify_signers && *dkim_verify_signers)
80a47a2c
TK
3276 {
3277 uschar *dkim_verify_signers_expanded =
3278 expand_string(dkim_verify_signers);
7e3ce68e 3279 if (!dkim_verify_signers_expanded)
80a47a2c
TK
3280 log_write(0, LOG_MAIN|LOG_PANIC,
3281 "expansion of dkim_verify_signers option failed: %s",
3282 expand_string_message);
7e3ce68e 3283
80a47a2c
TK
3284 else
3285 {
3286 int sep = 0;
55414b25 3287 const uschar *ptr = dkim_verify_signers_expanded;
80a47a2c 3288 uschar *item = NULL;
9e5d6b55
TK
3289 uschar *seen_items = NULL;
3290 int seen_items_size = 0;
3291 int seen_items_offset = 0;
9122af94
TK
3292 /* Default to OK when no items are present */
3293 rc = OK;
7e3ce68e 3294 while ((item = string_nextinlist(&ptr, &sep, NULL, 0)))
80a47a2c 3295 {
6119d1ea 3296 /* Prevent running ACL for an empty item */
7e3ce68e 3297 if (!item || !*item) continue;
5032d1cf
JH
3298
3299 /* Only run ACL once for each domain or identity,
3300 no matter how often it appears in the expanded list. */
3301 if (seen_items)
6119d1ea 3302 {
ae9094bf 3303 uschar *seen_item = NULL;
55414b25 3304 const uschar *seen_items_list = seen_items;
5032d1cf 3305 BOOL seen_this_item = FALSE;
61147df4 3306
ae9094bf 3307 while ((seen_item = string_nextinlist(&seen_items_list, &sep,
7e3ce68e 3308 NULL, 0)))
5032d1cf
JH
3309 if (Ustrcmp(seen_item,item) == 0)
3310 {
3311 seen_this_item = TRUE;
3312 break;
3313 }
3314
3315 if (seen_this_item)
6119d1ea
TK
3316 {
3317 DEBUG(D_receive)
5032d1cf
JH
3318 debug_printf("acl_smtp_dkim: skipping signer %s, "
3319 "already seen\n", item);
6119d1ea
TK
3320 continue;
3321 }
61147df4 3322
5032d1cf
JH
3323 seen_items = string_append(seen_items, &seen_items_size,
3324 &seen_items_offset, 1, ":");
6119d1ea
TK
3325 }
3326
5032d1cf
JH
3327 seen_items = string_append(seen_items, &seen_items_size,
3328 &seen_items_offset, 1, item);
4a73449b 3329 seen_items[seen_items_offset] = '\0';
6119d1ea
TK
3330
3331 DEBUG(D_receive)
5032d1cf
JH
3332 debug_printf("calling acl_smtp_dkim for dkim_cur_signer=%s\n",
3333 item);
6119d1ea 3334
80a47a2c 3335 dkim_exim_acl_setup(item);
5032d1cf
JH
3336 rc = acl_check(ACL_WHERE_DKIM, NULL, acl_smtp_dkim,
3337 &user_msg, &log_msg);
6119d1ea
TK
3338
3339 if (rc != OK)
5032d1cf
JH
3340 {
3341 DEBUG(D_receive)
3342 debug_printf("acl_smtp_dkim: acl_check returned %d on %s, "
3343 "skipping remaining items\n", rc, item);
3344 cancel_cutthrough_connection("dkim acl not ok");
3345 break;
3346 }
80a47a2c 3347 }
578d43dc 3348 add_acl_headers(ACL_WHERE_DKIM, US"DKIM");
80a47a2c
TK
3349 if (rc == DISCARD)
3350 {
3351 recipients_count = 0;
3352 blackholed_by = US"DKIM ACL";
3353 if (log_msg != NULL)
3354 blackhole_log_msg = string_sprintf(": %s", log_msg);
3355 }
3356 else if (rc != OK)
3357 {
3358 Uunlink(spool_name);
3359 if (smtp_handle_acl_fail(ACL_WHERE_DKIM, rc, user_msg, log_msg) != 0)
85ffcba6 3360 smtp_yield = FALSE; /* No more messages after dropped connection */
80a47a2c
TK
3361 smtp_reply = US""; /* Indicate reply already sent */
3362 message_id[0] = 0; /* Indicate no message accepted */
3363 goto TIDYUP; /* Skip to end of function */
3364 }
3365 }
3366 }
3367 }
4a8ce2d8 3368#endif /* DISABLE_DKIM */
fb2274d4 3369
8523533c 3370#ifdef WITH_CONTENT_SCAN
80a47a2c
TK
3371 if (recipients_count > 0 &&
3372 acl_smtp_mime != NULL &&
54cdb463
PH
3373 !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by))
3374 goto TIDYUP;
8523533c
TK
3375#endif /* WITH_CONTENT_SCAN */
3376
4840604e
TL
3377#ifdef EXPERIMENTAL_DMARC
3378 dmarc_up = dmarc_store_data(from_header);
3379#endif /* EXPERIMENTAL_DMARC */
3380
8ccd00b1
JH
3381#ifndef DISABLE_PRDR
3382 if (prdr_requested && recipients_count > 1 && acl_smtp_data_prdr)
fd98a5c6
JH
3383 {
3384 unsigned int c;
3385 int all_pass = OK;
3386 int all_fail = FAIL;
3387
3388 smtp_printf("353 PRDR content analysis beginning\r\n");
3389 /* Loop through recipients, responses must be in same order received */
3390 for (c = 0; recipients_count > c; c++)
3391 {
3392 uschar * addr= recipients_list[c].address;
3393 uschar * msg= US"PRDR R=<%s> %s";
3394 uschar * code;
3395 DEBUG(D_receive)
3396 debug_printf("PRDR processing recipient %s (%d of %d)\n",
3397 addr, c+1, recipients_count);
3398 rc = acl_check(ACL_WHERE_PRDR, addr,
3399 acl_smtp_data_prdr, &user_msg, &log_msg);
3400
3401 /* If any recipient rejected content, indicate it in final message */
3402 all_pass |= rc;
3403 /* If all recipients rejected, indicate in final message */
3404 all_fail &= rc;
3405
3406 switch (rc)
3407 {
3408 case OK: case DISCARD: code = US"250"; break;
3409 case DEFER: code = US"450"; break;
3410 default: code = US"550"; break;
3411 }
3412 if (user_msg != NULL)
3413 smtp_user_msg(code, user_msg);
3414 else
3415 {
3416 switch (rc)
3417 {
3418 case OK: case DISCARD:
3419 msg = string_sprintf(CS msg, addr, "acceptance"); break;
3420 case DEFER:
3421 msg = string_sprintf(CS msg, addr, "temporary refusal"); break;
3422 default:
3423 msg = string_sprintf(CS msg, addr, "refusal"); break;
3424 }
3425 smtp_user_msg(code, msg);
3426 }
3427 if (log_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, log_msg);
3428 else if (user_msg) log_write(0, LOG_MAIN, "PRDR %s %s", addr, user_msg);
112b6a93 3429 else log_write(0, LOG_MAIN, "%s", CS msg);
fd98a5c6
JH
3430
3431 if (rc != OK) { receive_remove_recipient(addr); c--; }
3432 }
3433 /* Set up final message, used if data acl gives OK */
3434 smtp_reply = string_sprintf("%s id=%s message %s",
3435 all_fail == FAIL ? US"550" : US"250",
3436 message_id,
3437 all_fail == FAIL
3438 ? US"rejected for all recipients"
3439 : all_pass == OK
3440 ? US"accepted"
3441 : US"accepted for some recipients");
3442 if (recipients_count == 0)
3443 {
3444 message_id[0] = 0; /* Indicate no message accepted */
3445 goto TIDYUP;
3446 }
3447 }
3448 else
3449 prdr_requested = FALSE;
8ccd00b1 3450#endif /* !DISABLE_PRDR */
fd98a5c6 3451
54cdb463
PH
3452 /* Check the recipients count again, as the MIME ACL might have changed
3453 them. */
8523533c 3454
059ec3d9
PH
3455 if (acl_smtp_data != NULL && recipients_count > 0)
3456 {
059ec3d9 3457 rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg);
578d43dc 3458 add_acl_headers(ACL_WHERE_DATA, US"DATA");
059ec3d9
PH
3459 if (rc == DISCARD)
3460 {
3461 recipients_count = 0;
3462 blackholed_by = US"DATA ACL";
8e669ac1
PH
3463 if (log_msg != NULL)
3464 blackhole_log_msg = string_sprintf(": %s", log_msg);
2e5b33cd 3465 cancel_cutthrough_connection("data acl discard");
059ec3d9
PH
3466 }
3467 else if (rc != OK)
3468 {
3469 Uunlink(spool_name);
2e5b33cd 3470 cancel_cutthrough_connection("data acl not ok");
8523533c
TK
3471#ifdef WITH_CONTENT_SCAN
3472 unspool_mbox();
6f0c431a
PP
3473#endif
3474#ifdef EXPERIMENTAL_DCC
3475 dcc_ok = 0;
8523533c 3476#endif
059ec3d9 3477 if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0)
85ffcba6 3478 smtp_yield = FALSE; /* No more messages after dropped connection */
059ec3d9
PH
3479 smtp_reply = US""; /* Indicate reply already sent */
3480 message_id[0] = 0; /* Indicate no message accepted */
3481 goto TIDYUP; /* Skip to end of function */
3482 }
3483 }
3484 }
3485
3486 /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that
3487 we cannot take different actions for permanent and temporary rejections. */
3488
54cdb463 3489 else
059ec3d9 3490 {
54cdb463
PH
3491
3492#ifdef WITH_CONTENT_SCAN
3493 if (acl_not_smtp_mime != NULL &&
3494 !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply,
3495 &blackholed_by))
3496 goto TIDYUP;
3497#endif /* WITH_CONTENT_SCAN */
3498
3499 if (acl_not_smtp != NULL)
059ec3d9 3500 {
54cdb463
PH
3501 uschar *user_msg, *log_msg;
3502 rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg);
3503 if (rc == DISCARD)
059ec3d9 3504 {
54cdb463
PH
3505 recipients_count = 0;
3506 blackholed_by = US"non-SMTP ACL";
3507 if (log_msg != NULL)
3508 blackhole_log_msg = string_sprintf(": %s", log_msg);
059ec3d9 3509 }
54cdb463 3510 else if (rc != OK)
059ec3d9 3511 {
54cdb463
PH
3512 Uunlink(spool_name);
3513#ifdef WITH_CONTENT_SCAN
3514 unspool_mbox();
6f0c431a
PP
3515#endif
3516#ifdef EXPERIMENTAL_DCC
3517 dcc_ok = 0;
54cdb463 3518#endif
6ea85e9a
PH
3519 /* The ACL can specify where rejections are to be logged, possibly
3520 nowhere. The default is main and reject logs. */
3521
3522 if (log_reject_target != 0)
3523 log_write(0, log_reject_target, "F=<%s> rejected by non-SMTP ACL: %s",
3524 sender_address, log_msg);
3525
54cdb463
PH
3526 if (user_msg == NULL) user_msg = US"local configuration problem";
3527 if (smtp_batched_input)
3528 {
3529 moan_smtp_batch(NULL, "%d %s", 550, user_msg);
3530 /* Does not return */
3531 }
3532 else
3533 {
3534 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3535 give_local_error(ERRMESS_LOCAL_ACL, user_msg,
3536 US"message rejected by non-SMTP ACL: ", error_rc, data_file,
3537 header_list);
3538 /* Does not return */
3539 }
059ec3d9 3540 }
578d43dc 3541 add_acl_headers(ACL_WHERE_NOTSMTP, US"non-SMTP");
059ec3d9 3542 }
059ec3d9
PH
3543 }
3544
54cdb463
PH
3545 /* The applicable ACLs have been run */
3546
059ec3d9
PH
3547 if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */
3548 if (queue_only_policy) queued_by = US"ACL";
059ec3d9
PH
3549 }
3550
8523533c
TK
3551#ifdef WITH_CONTENT_SCAN
3552unspool_mbox();
3553#endif
3554
6a8f9482
TK
3555#ifdef EXPERIMENTAL_DCC
3556dcc_ok = 0;
3557#endif
3558
3559
059ec3d9
PH
3560/* The final check on the message is to run the scan_local() function. The
3561version supplied with Exim always accepts, but this is a hook for sysadmins to
3562supply their own checking code. The local_scan() function is run even when all
3563the recipients have been discarded. */
3564
3565lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3566
3567/* Arrange to catch crashes in local_scan(), so that the -D file gets
3568deleted, and the incident gets logged. */
3569
3570os_non_restarting_signal(SIGSEGV, local_scan_crash_handler);
3571os_non_restarting_signal(SIGFPE, local_scan_crash_handler);
3572os_non_restarting_signal(SIGILL, local_scan_crash_handler);
3573os_non_restarting_signal(SIGBUS, local_scan_crash_handler);
3574
3575DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n",
3576 local_scan_timeout);
3577local_scan_data = NULL;
3578
3579os_non_restarting_signal(SIGALRM, local_scan_timeout_handler);
3580if (local_scan_timeout > 0) alarm(local_scan_timeout);
3581rc = local_scan(data_fd, &local_scan_data);
3582alarm(0);
3583os_non_restarting_signal(SIGALRM, sigalrm_handler);
3584
0e20aff9
MH
3585enable_dollar_recipients = FALSE;
3586
059ec3d9
PH
3587store_pool = POOL_MAIN; /* In case changed */
3588DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc,
3589 local_scan_data);
3590
3591os_non_restarting_signal(SIGSEGV, SIG_DFL);
3592os_non_restarting_signal(SIGFPE, SIG_DFL);
3593os_non_restarting_signal(SIGILL, SIG_DFL);
3594os_non_restarting_signal(SIGBUS, SIG_DFL);
3595
3596/* The length check is paranoia against some runaway code, and also because
3597(for a success return) lines in the spool file are read into big_buffer. */
3598
3599if (local_scan_data != NULL)
3600 {
3601 int len = Ustrlen(local_scan_data);
3602 if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN;
3603 local_scan_data = string_copyn(local_scan_data, len);
3604 }
3605
3606if (rc == LOCAL_SCAN_ACCEPT_FREEZE)
3607 {
58eb016e 3608 if (!deliver_freeze) /* ACL might have already frozen */
059ec3d9
PH
3609 {
3610 deliver_freeze = TRUE;
3611 deliver_frozen_at = time(NULL);
3612 frozen_by = US"local_scan()";
3613 }
3614 rc = LOCAL_SCAN_ACCEPT;
3615 }
3616else if (rc == LOCAL_SCAN_ACCEPT_QUEUE)
3617 {
3618 if (!queue_only_policy) /* ACL might have already queued */
3619 {
3620 queue_only_policy = TRUE;
3621 queued_by = US"local_scan()";
3622 }
3623 rc = LOCAL_SCAN_ACCEPT;
3624 }
3625
3626/* Message accepted: remove newlines in local_scan_data because otherwise
3627the spool file gets corrupted. Ensure that all recipients are qualified. */
3628
3629if (rc == LOCAL_SCAN_ACCEPT)
3630 {
3631 if (local_scan_data != NULL)
3632 {
3633 uschar *s;
3634 for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' ';
3635 }
3636 for (i = 0; i < recipients_count; i++)
3637 {
3638 recipient_item *r = recipients_list + i;
3639 r->address = rewrite_address_qualify(r->address, TRUE);
3640 if (r->errors_to != NULL)
3641 r->errors_to = rewrite_address_qualify(r->errors_to, TRUE);
3642 }
3643 if (recipients_count == 0 && blackholed_by == NULL)
3644 blackholed_by = US"local_scan";
3645 }
3646
3647/* Message rejected: newlines permitted in local_scan_data to generate
3648multiline SMTP responses. */
3649
3650else
3651 {
3652 uschar *istemp = US"";
3653 uschar *s = NULL;
a5bd321b 3654 uschar *smtp_code;
059ec3d9
PH
3655 int size = 0;
3656 int sptr = 0;
059ec3d9
PH
3657
3658 errmsg = local_scan_data;
3659
3660 Uunlink(spool_name); /* Cancel this message */
3661 switch(rc)
3662 {
3663 default:
3664 log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary "
3665 "rejection given", rc);
3666 goto TEMPREJECT;
3667
3668 case LOCAL_SCAN_REJECT_NOLOGHDR:
6c6d6e48 3669 BIT_CLEAR(log_selector, log_selector_size, Li_rejected_header);
059ec3d9
PH
3670 /* Fall through */
3671
3672 case LOCAL_SCAN_REJECT:
a5bd321b 3673 smtp_code = US"550";
059ec3d9
PH
3674 if (errmsg == NULL) errmsg = US"Administrative prohibition";
3675 break;
3676
3677 case LOCAL_SCAN_TEMPREJECT_NOLOGHDR:
6c6d6e48 3678 BIT_CLEAR(log_selector, log_selector_size, Li_rejected_header);
059ec3d9
PH
3679 /* Fall through */
3680
3681 case LOCAL_SCAN_TEMPREJECT:
3682 TEMPREJECT:
a5bd321b 3683 smtp_code = US"451";
059ec3d9
PH
3684 if (errmsg == NULL) errmsg = US"Temporary local problem";
3685 istemp = US"temporarily ";
3686 break;
3687 }
3688
3689 s = string_append(s, &size, &sptr, 2, US"F=",
3690 (sender_address[0] == 0)? US"<>" : sender_address);
3691 s = add_host_info_for_log(s, &size, &sptr);
3692 s[sptr] = 0;
3693
3694 log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s",
3695 s, istemp, string_printing(errmsg));
3696
3697 if (smtp_input)
3698 {
3699 if (!smtp_batched_input)
3700 {
a5bd321b 3701 smtp_respond(smtp_code, 3, TRUE, errmsg);
059ec3d9
PH
3702 message_id[0] = 0; /* Indicate no message accepted */
3703 smtp_reply = US""; /* Indicate reply already sent */
3704 goto TIDYUP; /* Skip to end of function */
3705 }
3706 else
3707 {
a5bd321b 3708 moan_smtp_batch(NULL, "%s %s", smtp_code, errmsg);
059ec3d9
PH
3709 /* Does not return */
3710 }
3711 }
3712 else
3713 {
3714 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3715 give_local_error(ERRMESS_LOCAL_SCAN, errmsg,
3716 US"message rejected by local scan code: ", error_rc, data_file,
3717 header_list);
3718 /* Does not return */
3719 }
3720 }
3721
3722/* Reset signal handlers to ignore signals that previously would have caused
3723the message to be abandoned. */
3724
3725signal(SIGTERM, SIG_IGN);
3726signal(SIGINT, SIG_IGN);
3727
e4bdf652 3728
059ec3d9
PH
3729/* Ensure the first time flag is set in the newly-received message. */
3730
3731deliver_firsttime = TRUE;
3732
8523533c 3733#ifdef EXPERIMENTAL_BRIGHTMAIL
a2da3176
JH
3734if (bmi_run == 1)
3735 { /* rewind data file */
8523533c
TK
3736 lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3737 bmi_verdicts = bmi_process_message(header_list, data_fd);
a2da3176 3738 }
8523533c
TK
3739#endif
3740
4c04137d 3741/* Update the timestamp in our Received: header to account for any time taken by
059ec3d9
PH
3742an ACL or by local_scan(). The new time is the time that all reception
3743processing is complete. */
3744
3745timestamp = expand_string(US"${tod_full}");
3746tslen = Ustrlen(timestamp);
3747
3748memcpy(received_header->text + received_header->slen - tslen - 1,
3749 timestamp, tslen);
3750
3751/* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */
3752
3753if (mua_wrapper)
3754 {
3755 deliver_freeze = FALSE;
3756 queue_only_policy = FALSE;
3757 }
3758
3759/* Keep the data file open until we have written the header file, in order to
3760hold onto the lock. In a -bh run, or if the message is to be blackholed, we
3761don't write the header file, and we unlink the data file. If writing the header
3762file fails, we have failed to accept this message. */
3763
3764if (host_checking || blackholed_by != NULL)
3765 {
3766 header_line *h;
3767 Uunlink(spool_name);
3768 msg_size = 0; /* Compute size for log line */
3769 for (h = header_list; h != NULL; h = h->next)
3770 if (h->type != '*') msg_size += h->slen;
3771 }
3772
3773/* Write the -H file */
3774
3775else
059ec3d9
PH
3776 if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0)
3777 {
3778 log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg);
3779 Uunlink(spool_name); /* Lose the data file */
3780
3781 if (smtp_input)
3782 {
3783 smtp_reply = US"451 Error in writing spool file";
3784 message_id[0] = 0; /* Indicate no message accepted */
3785 goto TIDYUP;
3786 }
3787 else
3788 {
3789 fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET);
3790 give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file,
3791 header_list);
3792 /* Does not return */
3793 }
3794 }
059ec3d9
PH
3795
3796
3797/* The message has now been successfully received. */
3798
3799receive_messagecount++;
3800
3801/* In SMTP sessions we may receive several in one connection. After each one,
3802we wait for the clock to tick at the level of message-id granularity. This is
3803so that the combination of time+pid is unique, even on systems where the pid
3804can be re-used within our time interval. We can't shorten the interval without
3805re-designing the message-id. See comments above where the message id is
3806created. This is Something For The Future. */
3807
3808message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution;
3809exim_wait_tick(&message_id_tv, id_resolution);
3810
3811/* Add data size to written header size. We do not count the initial file name
3812that is in the file, but we do add one extra for the notional blank line that
3813precedes the data. This total differs from message_size in that it include the
3814added Received: header and any other headers that got created locally. */
3815
3816fflush(data_file);
3817fstat(data_fd, &statbuf);
3818
3819msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1;
3820
3821/* Generate a "message received" log entry. We do this by building up a dynamic
3822string as required. Since we commonly want to add two items at a time, use a
3823macro to simplify the coding. We log the arrival of a new message while the
3824file is still locked, just in case the machine is *really* fast, and delivers
3825it first! Include any message id that is in the message - since the syntax of a
4c04137d 3826message id is actually an addr-spec, we can use the parse routine to canonicalize
059ec3d9
PH
3827it. */
3828
3829size = 256;
3830sptr = 0;
3831s = store_get(size);
3832
27b9e5f4
JH
3833s = string_append(s, &size, &sptr, 2,
3834 fake_response == FAIL ? US"(= " : US"<= ",
3835 sender_address[0] == 0 ? US"<>" : sender_address);
3836if (message_reference)
059ec3d9
PH
3837 s = string_append(s, &size, &sptr, 2, US" R=", message_reference);
3838
3839s = add_host_info_for_log(s, &size, &sptr);
3840
3841#ifdef SUPPORT_TLS
6c6d6e48 3842if (LOGGING(tls_cipher) && tls_in.cipher)
817d9f57 3843 s = string_append(s, &size, &sptr, 2, US" X=", tls_in.cipher);
6c6d6e48 3844if (LOGGING(tls_certificate_verified) && tls_in.cipher)
059ec3d9 3845 s = string_append(s, &size, &sptr, 2, US" CV=",
27b9e5f4 3846 tls_in.certificate_verified ? "yes":"no");
6c6d6e48 3847if (LOGGING(tls_peerdn) && tls_in.peerdn)
48ed62d9 3848 s = string_append(s, &size, &sptr, 3, US" DN=\"",
817d9f57 3849 string_printing(tls_in.peerdn), US"\"");
6c6d6e48 3850if (LOGGING(tls_sni) && tls_in.sni)
3f0945ff 3851 s = string_append(s, &size, &sptr, 3, US" SNI=\"",
817d9f57 3852 string_printing(tls_in.sni), US"\"");
3f0945ff 3853#endif
059ec3d9 3854
8ccd00b1 3855if (sender_host_authenticated)
059ec3d9
PH
3856 {
3857 s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated);
27b9e5f4 3858 if (authenticated_id)
c8e2fc1e 3859 {
059ec3d9 3860 s = string_append(s, &size, &sptr, 2, US":", authenticated_id);
27b9e5f4 3861 if (LOGGING(smtp_mailauth) && authenticated_sender)
c8e2fc1e
JH
3862 s = string_append(s, &size, &sptr, 2, US":", authenticated_sender);
3863 }
059ec3d9
PH
3864 }
3865
8ccd00b1 3866#ifndef DISABLE_PRDR
fd98a5c6 3867if (prdr_requested)
7e3ce68e 3868 s = string_catn(s, &size, &sptr, US" PRDR", 5);
fd98a5c6 3869#endif
8ccd00b1 3870
cee5f132 3871#ifdef SUPPORT_PROXY
6c6d6e48 3872if (proxy_session && LOGGING(proxy))
e6d2a989 3873 s = string_append(s, &size, &sptr, 2, US" PRX=", proxy_local_address);
a3c86431 3874#endif
fd98a5c6 3875
7e3ce68e
JH
3876if (chunking_state > CHUNKING_OFFERED)
3877 s = string_catn(s, &size, &sptr, US" K", 2);
3878
059ec3d9
PH
3879sprintf(CS big_buffer, "%d", msg_size);
3880s = string_append(s, &size, &sptr, 2, US" S=", big_buffer);
3881
3c0a92dc
JH
3882/* log 8BITMIME mode announced in MAIL_FROM
3883 0 ... no BODY= used
3884 7 ... 7BIT
3885 8 ... 8BITMIME */
6c6d6e48 3886if (LOGGING(8bitmime))
c8e2fc1e 3887 {
3c0a92dc
JH
3888 sprintf(CS big_buffer, "%d", body_8bitmime);
3889 s = string_append(s, &size, &sptr, 2, US" M8S=", big_buffer);
c8e2fc1e 3890 }
3c0a92dc 3891
afa6d3ad
JH
3892if (*queue_name)
3893 s = string_append(s, &size, &sptr, 2, US" Q=", queue_name);
3894
059ec3d9
PH
3895/* If an addr-spec in a message-id contains a quoted string, it can contain
3896any characters except " \ and CR and so in particular it can contain NL!
3897Therefore, make sure we use a printing-characters only version for the log.
3898Also, allow for domain literals in the message id. */
3899
27b9e5f4 3900if (msgid_header)
059ec3d9
PH
3901 {
3902 uschar *old_id;
3903 BOOL save_allow_domain_literals = allow_domain_literals;
3904 allow_domain_literals = TRUE;
3905 old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1,
3906 &errmsg, &start, &end, &domain, FALSE);
3907 allow_domain_literals = save_allow_domain_literals;
3908 if (old_id != NULL)
3909 s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id));
3910 }
3911
3912/* If subject logging is turned on, create suitable printing-character
3913text. By expanding $h_subject: we make use of the MIME decoding. */
3914
6c6d6e48 3915if (LOGGING(subject) && subject_header != NULL)
059ec3d9
PH
3916 {
3917 int i;
3918 uschar *p = big_buffer;
3919 uschar *ss = expand_string(US"$h_subject:");
3920
3921 /* Backslash-quote any double quotes or backslashes so as to make a
3922 a C-like string, and turn any non-printers into escape sequences. */
3923
3924 *p++ = '\"';
3925 if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++)
3926 {
3927 if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\';
3928 *p++ = ss[i];
3929 }
3930 *p++ = '\"';
3931 *p = 0;
3932 s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer));
3933 }
3934
3935/* Terminate the string: string_cat() and string_append() leave room, but do
3936not put the zero in. */
3937
3938s[sptr] = 0;
3939
059ec3d9
PH
3940/* Create a message log file if message logs are being used and this message is
3941not blackholed. Write the reception stuff to it. We used to leave message log
e4bdf652 3942creation until the first delivery, but this has proved confusing for some
059ec3d9
PH
3943people. */
3944
3945if (message_logs && blackholed_by == NULL)
3946 {
3947 int fd;
3948
41313d92 3949 spool_name = spool_fname(US"msglog", message_subdir, message_id, US"");
a2da3176
JH
3950
3951 if ( (fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE)) < 0
3952 && errno == ENOENT
3953 )
059ec3d9 3954 {
41313d92
JH
3955 (void)directory_make(spool_directory,
3956 spool_sname(US"msglog", message_subdir),
3957 MSGLOG_DIRECTORY_MODE, TRUE);
059ec3d9
PH
3958 fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE);
3959 }
3960
3961 if (fd < 0)
3962 {
3963 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s",
3964 spool_name, strerror(errno));
3965 }
3966
3967 else
3968 {
3969 FILE *message_log = fdopen(fd, "a");
3970 if (message_log == NULL)
3971 {
3972 log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s",
3973 spool_name, strerror(errno));
f1e894f3 3974 (void)close(fd);
059ec3d9
PH
3975 }
3976 else
3977 {
3978 uschar *now = tod_stamp(tod_log);
3979 fprintf(message_log, "%s Received from %s\n", now, s+3);
3980 if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now,
3981 frozen_by);
3982 if (queue_only_policy) fprintf(message_log,
e8012beb
JH
3983 "%s no immediate delivery: queued%s%s by %s\n", now,
3984 *queue_name ? " in " : "", *queue_name ? CS queue_name : "",
3985 queued_by);
f1e894f3 3986 (void)fclose(message_log);
059ec3d9
PH
3987 }
3988 }
3989 }
3990
58eb016e
PH
3991/* Everything has now been done for a successful message except logging its
3992arrival, and outputting an SMTP response. While writing to the log, set a flag
3993to cause a call to receive_bomb_out() if the log cannot be opened. */
3994
3995receive_call_bombout = TRUE;
3996
563b63fa
PH
3997/* Before sending an SMTP response in a TCP/IP session, we check to see if the
3998connection has gone away. This can only be done if there is no unconsumed input
3999waiting in the local input buffer. We can test for this by calling
4000receive_smtp_buffered(). RFC 2920 (pipelining) explicitly allows for additional
4001input to be sent following the final dot, so the presence of following input is
4002not an error.
58eb016e 4003
563b63fa
PH
4004If the connection is still present, but there is no unread input for the
4005socket, the result of a select() call will be zero. If, however, the connection
4006has gone away, or if there is pending input, the result of select() will be
4007non-zero. The two cases can be distinguished by trying to read the next input
4008character. If we succeed, we can unread it so that it remains in the local
4009buffer for handling later. If not, the connection has been lost.
58eb016e 4010
563b63fa
PH
4011Of course, since TCP/IP is asynchronous, there is always a chance that the
4012connection will vanish between the time of this test and the sending of the
4013response, but the chance of this happening should be small. */
4014
4015if (smtp_input && sender_host_address != NULL && !sender_host_notsocket &&
4016 !receive_smtp_buffered())
58eb016e
PH
4017 {
4018 struct timeval tv;
4019 fd_set select_check;
4020 FD_ZERO(&select_check);
4021 FD_SET(fileno(smtp_in), &select_check);
4022 tv.tv_sec = 0;
4023 tv.tv_usec = 0;
4024
563b63fa 4025 if (select(fileno(smtp_in) + 1, &select_check, NULL, NULL, &tv) != 0)
58eb016e 4026 {
80a47a2c
TK
4027 int c = (receive_getc)();
4028 if (c != EOF) (receive_ungetc)(c); else
58eb016e 4029 {
eea0defe 4030 smtp_notquit_exit(US"connection-lost", NULL, NULL);
563b63fa
PH
4031 smtp_reply = US""; /* No attempt to send a response */
4032 smtp_yield = FALSE; /* Nothing more on this connection */
58eb016e 4033
563b63fa 4034 /* Re-use the log line workspace */
58eb016e 4035
563b63fa 4036 sptr = 0;
eea0defe 4037 s = string_cat(s, &size, &sptr, US"SMTP connection lost after final dot");
563b63fa
PH
4038 s = add_host_info_for_log(s, &size, &sptr);
4039 s[sptr] = 0;
4040 log_write(0, LOG_MAIN, "%s", s);
58eb016e 4041
563b63fa 4042 /* Delete the files for this aborted message. */
58eb016e 4043
41313d92
JH
4044 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-D"));
4045 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-H"));
4046 Uunlink(spool_fname(US"msglog", message_subdir, message_id, US""));
58eb016e 4047
563b63fa
PH
4048 goto TIDYUP;
4049 }
58eb016e
PH
4050 }
4051 }
4052
4053/* The connection has not gone away; we really are going to take responsibility
4054for this message. */
4055
817d9f57 4056/* Cutthrough - had sender last-dot; assume we've sent (or bufferred) all
e4bdf652
JH
4057 data onward by now.
4058
817d9f57 4059 Send dot onward. If accepted, wipe the spooled files, log as delivered and accept
e4bdf652 4060 the sender's dot (below).
4c04137d 4061 If rejected: copy response to sender, wipe the spooled files, log appropriately.
ff5929e3
JH
4062 If temp-reject: normally accept to sender, keep the spooled file - unless defer=pass
4063 in which case pass temp-reject back to initiator and dump the files.
e4bdf652
JH
4064
4065 Having the normal spool files lets us do data-filtering, and store/forward on temp-reject.
817d9f57
JH
4066
4067 XXX We do not handle queue-only, freezing, or blackholes.
e4bdf652 4068*/
5032d1cf 4069if(cutthrough.fd >= 0)
e4bdf652 4070 {
85ffcba6 4071 uschar * msg= cutthrough_finaldot(); /* Ask the target system to accept the message */
817d9f57 4072 /* Logging was done in finaldot() */
e4bdf652 4073 switch(msg[0])
817d9f57
JH
4074 {
4075 case '2': /* Accept. Do the same to the source; dump any spoolfiles. */
b784ce7f 4076 cutthrough_done = ACCEPTED;
817d9f57 4077 break; /* message_id needed for SMTP accept below */
61147df4 4078
ff5929e3
JH
4079 case '4': /* Temp-reject. Keep spoolfiles and accept, unless defer-pass mode.
4080 ... for which, pass back the exact error */
4081 if (cutthrough.defer_pass) smtp_reply = string_copy_malloc(msg);
4082 /*FALLTRHOUGH*/
4083
817d9f57 4084 default: /* Unknown response, or error. Treat as temp-reject. */
b784ce7f 4085 cutthrough_done = TMP_REJ; /* Avoid the usual immediate delivery attempt */
817d9f57 4086 break; /* message_id needed for SMTP accept below */
61147df4 4087
817d9f57 4088 case '5': /* Perm-reject. Do the same to the source. Dump any spoolfiles */
ff5929e3 4089 smtp_reply = string_copy_malloc(msg); /* Pass on the exact error */
b784ce7f 4090 cutthrough_done = PERM_REJ;
817d9f57
JH
4091 break;
4092 }
e4bdf652 4093 }
58eb016e 4094
8ccd00b1
JH
4095#ifndef DISABLE_PRDR
4096if(!smtp_reply || prdr_requested)
4097#else
4098if(!smtp_reply)
fd98a5c6 4099#endif
e4bdf652
JH
4100 {
4101 log_write(0, LOG_MAIN |
6c6d6e48
TF
4102 (LOGGING(received_recipients)? LOG_RECIPIENTS : 0) |
4103 (LOGGING(received_sender)? LOG_SENDER : 0),
e4bdf652
JH
4104 "%s", s);
4105
4106 /* Log any control actions taken by an ACL or local_scan(). */
58eb016e 4107
e4bdf652
JH
4108 if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by);
4109 if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN,
e8012beb
JH
4110 "no immediate delivery: queued%s%s by %s",
4111 *queue_name ? " in " : "", *queue_name ? CS queue_name : "",
4112 queued_by);
e4bdf652
JH
4113 }
4114receive_call_bombout = FALSE;
58eb016e 4115
059ec3d9
PH
4116store_reset(s); /* The store for the main log message can be reused */
4117
4118/* If the message is frozen, and freeze_tell is set, do the telling. */
4119
4120if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0)
4121 {
4122 moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival",
4123 "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n",
4124 message_id, frozen_by, sender_address);
4125 }
4126
4127
4128/* Either a message has been successfully received and written to the two spool
4129files, or an error in writing the spool has occurred for an SMTP message, or
58eb016e
PH
4130an SMTP message has been rejected for policy reasons. (For a non-SMTP message
4131we will have already given up because there's no point in carrying on!) In
4132either event, we must now close (and thereby unlock) the data file. In the
059ec3d9
PH
4133successful case, this leaves the message on the spool, ready for delivery. In
4134the error case, the spool file will be deleted. Then tidy up store, interact
4135with an SMTP call if necessary, and return.
4136
4137A fflush() was done earlier in the expectation that any write errors on the
4138data file will be flushed(!) out thereby. Nevertheless, it is theoretically
4139possible for fclose() to fail - but what to do? What has happened to the lock
4140if this happens? */
4141
e4bdf652 4142
059ec3d9 4143TIDYUP:
f1e894f3
PH
4144process_info[process_info_len] = 0; /* Remove message id */
4145if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */
059ec3d9
PH
4146
4147/* Now reset signal handlers to their defaults */
4148
4149signal(SIGTERM, SIG_DFL);
4150signal(SIGINT, SIG_DFL);
4151
4152/* Tell an SMTP caller the state of play, and arrange to return the SMTP return
4153value, which defaults TRUE - meaning there may be more incoming messages from
4154this connection. For non-SMTP callers (where there is only ever one message),
4155the default is FALSE. */
4156
4157if (smtp_input)
4158 {
4159 yield = smtp_yield;
4160
4161 /* Handle interactive SMTP callers. After several kinds of error, smtp_reply
58eb016e
PH
4162 is set to the response that should be sent. When it is NULL, we generate
4163 default responses. After an ACL error or local_scan() error, the response has
4164 already been sent, and smtp_reply is an empty string to indicate this. */
059ec3d9
PH
4165
4166 if (!smtp_batched_input)
4167 {
27b9e5f4 4168 if (!smtp_reply)
059ec3d9 4169 {
29aba418 4170 if (fake_response != OK)
27b9e5f4
JH
4171 smtp_respond(fake_response == DEFER ? US"450" : US"550",
4172 3, TRUE, fake_response_text);
4e88a19f
PH
4173
4174 /* An OK response is required; use "message" text if present. */
4175
27b9e5f4 4176 else if (user_msg)
4e88a19f
PH
4177 {
4178 uschar *code = US"250";
4179 int len = 3;
4f6ae5c3 4180 smtp_message_code(&code, &len, &user_msg, NULL, TRUE);
4e88a19f
PH
4181 smtp_respond(code, len, TRUE, user_msg);
4182 }
4183
4184 /* Default OK response */
4185
7e3ce68e
JH
4186 else if (chunking_state > CHUNKING_OFFERED)
4187 {
4188 smtp_printf("250- %u byte chunk, total %d\r\n250 OK id=%s\r\n",
4189 chunking_datasize, message_size+message_linecount, message_id);
4190 chunking_state = CHUNKING_OFFERED;
4191 }
8e669ac1
PH
4192 else
4193 smtp_printf("250 OK id=%s\r\n", message_id);
7e3ce68e 4194
059ec3d9
PH
4195 if (host_checking)
4196 fprintf(stdout,
4197 "\n**** SMTP testing: that is not a real message id!\n\n");
4198 }
4e88a19f 4199
58eb016e 4200 /* smtp_reply is set non-empty */
4e88a19f 4201
8523533c 4202 else if (smtp_reply[0] != 0)
29aba418 4203 if (fake_response != OK && (smtp_reply[0] == '2'))
a5bd321b
PH
4204 smtp_respond((fake_response == DEFER)? US"450" : US"550", 3, TRUE,
4205 fake_response_text);
8e669ac1 4206 else
6951ac6c 4207 smtp_printf("%.1024s\r\n", smtp_reply);
e4bdf652 4208
817d9f57
JH
4209 switch (cutthrough_done)
4210 {
ff5929e3
JH
4211 case ACCEPTED:
4212 log_write(0, LOG_MAIN, "Completed");/* Delivery was done */
41313d92 4213 case PERM_REJ:
ff5929e3
JH
4214 /* Delete spool files */
4215 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-D"));
4216 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-H"));
4217 Uunlink(spool_fname(US"msglog", message_subdir, message_id, US""));
4218 message_id[0] = 0; /* Prevent a delivery from starting */
4219 break;
4220
4221 case TMP_REJ:
4222 if (cutthrough.defer_pass)
4223 {
4224 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-D"));
4225 Uunlink(spool_fname(US"input", message_subdir, message_id, US"-H"));
4226 Uunlink(spool_fname(US"msglog", message_subdir, message_id, US""));
4227 }
4228 message_id[0] = 0; /* Prevent a delivery from starting */
4229 default:
4230 break;
e4bdf652 4231 }
5032d1cf 4232 cutthrough.delivery = FALSE;
ff5929e3 4233 cutthrough.defer_pass = FALSE;
059ec3d9
PH
4234 }
4235
4236 /* For batched SMTP, generate an error message on failure, and do
4237 nothing on success. The function moan_smtp_batch() does not return -
4238 it exits from the program with a non-zero return code. */
4239
27b9e5f4
JH
4240 else if (smtp_reply)
4241 moan_smtp_batch(NULL, "%s", smtp_reply);
059ec3d9
PH
4242 }
4243
4244
4245/* If blackholing, we can immediately log this message's sad fate. The data
4246file has already been unlinked, and the header file was never written to disk.
4247We must now indicate that nothing was received, to prevent a delivery from
4248starting. */
4249
27b9e5f4 4250if (blackholed_by)
059ec3d9 4251 {
55414b25
JH
4252 const uschar *detail = local_scan_data
4253 ? string_printing(local_scan_data)
4254 : string_sprintf("(%s discarded recipients)", blackholed_by);
04f7d5b9 4255 log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg);
059ec3d9
PH
4256 log_write(0, LOG_MAIN, "Completed");
4257 message_id[0] = 0;
4258 }
4259
4260/* Reset headers so that logging of rejects for a subsequent message doesn't
4261include them. It is also important to set header_last = NULL before exiting
4262from this function, as this prevents certain rewrites that might happen during
4263subsequent verifying (of another incoming message) from trying to add headers
4264when they shouldn't. */
4265
4266header_list = header_last = NULL;
4267
4268return yield; /* TRUE if more messages (SMTP only) */
4269}
4270
4271/* End of receive.c */