| 1 | /* $Cambridge: exim/src/src/receive.c,v 1.20 2005/06/27 14:29:43 ph10 Exp $ */ |
| 2 | |
| 3 | /************************************************* |
| 4 | * Exim - an Internet mail transport agent * |
| 5 | *************************************************/ |
| 6 | |
| 7 | /* Copyright (c) University of Cambridge 1995 - 2005 */ |
| 8 | /* See the file NOTICE for conditions of use and distribution. */ |
| 9 | |
| 10 | /* Code for receiving a message and setting up spool files. */ |
| 11 | |
| 12 | #include "exim.h" |
| 13 | |
| 14 | #ifdef EXPERIMENTAL_DOMAINKEYS |
| 15 | #define RECEIVE_GETC dk_receive_getc |
| 16 | #define RECEIVE_UNGETC dk_receive_ungetc |
| 17 | #else |
| 18 | #define RECEIVE_GETC receive_getc |
| 19 | #define RECEIVE_UNGETC receive_ungetc |
| 20 | #endif |
| 21 | |
| 22 | /************************************************* |
| 23 | * Local static variables * |
| 24 | *************************************************/ |
| 25 | |
| 26 | static FILE *data_file = NULL; |
| 27 | static int data_fd = -1; |
| 28 | static uschar spool_name[256]; |
| 29 | |
| 30 | |
| 31 | |
| 32 | /************************************************* |
| 33 | * Non-SMTP character reading functions * |
| 34 | *************************************************/ |
| 35 | |
| 36 | /* These are the default functions that are set up in the variables such as |
| 37 | receive_getc initially. They just call the standard functions, passing stdin as |
| 38 | the file. (When SMTP input is occurring, different functions are used by |
| 39 | changing the pointer variables.) */ |
| 40 | |
| 41 | int |
| 42 | stdin_getc(void) |
| 43 | { |
| 44 | return getc(stdin); |
| 45 | } |
| 46 | |
| 47 | int |
| 48 | stdin_ungetc(int c) |
| 49 | { |
| 50 | return ungetc(c, stdin); |
| 51 | } |
| 52 | |
| 53 | int |
| 54 | stdin_feof(void) |
| 55 | { |
| 56 | return feof(stdin); |
| 57 | } |
| 58 | |
| 59 | int |
| 60 | stdin_ferror(void) |
| 61 | { |
| 62 | return ferror(stdin); |
| 63 | } |
| 64 | |
| 65 | |
| 66 | |
| 67 | |
| 68 | /************************************************* |
| 69 | * Check that a set sender is allowed * |
| 70 | *************************************************/ |
| 71 | |
| 72 | /* This function is called when a local caller sets an explicit sender address. |
| 73 | It checks whether this is permitted, which it is for trusted callers. |
| 74 | Otherwise, it must match the pattern(s) in untrusted_set_sender. |
| 75 | |
| 76 | Arguments: the proposed sender address |
| 77 | Returns: TRUE for a trusted caller |
| 78 | TRUE if the address has been set, untrusted_set_sender has been |
| 79 | set, and the address matches something in the list |
| 80 | FALSE otherwise |
| 81 | */ |
| 82 | |
| 83 | BOOL |
| 84 | receive_check_set_sender(uschar *newsender) |
| 85 | { |
| 86 | uschar *qnewsender; |
| 87 | if (trusted_caller) return TRUE; |
| 88 | if (newsender == NULL || untrusted_set_sender == NULL) return FALSE; |
| 89 | qnewsender = (Ustrchr(newsender, '@') != NULL)? |
| 90 | newsender : string_sprintf("%s@%s", newsender, qualify_domain_sender); |
| 91 | return |
| 92 | match_address_list(qnewsender, TRUE, TRUE, &untrusted_set_sender, NULL, -1, |
| 93 | 0, NULL) == OK; |
| 94 | } |
| 95 | |
| 96 | |
| 97 | |
| 98 | |
| 99 | /************************************************* |
| 100 | * Read space info for a partition * |
| 101 | *************************************************/ |
| 102 | |
| 103 | /* This function is called by receive_check_fs() below, and also by string |
| 104 | expansion for variables such as $spool_space. The field names for the statvfs |
| 105 | structure are macros, because not all OS have F_FAVAIL and it seems tidier to |
| 106 | have macros for F_BAVAIL and F_FILES as well. Some kinds of file system do not |
| 107 | have inodes, and they return -1 for the number available. |
| 108 | |
| 109 | Later: It turns out that some file systems that do not have the concept of |
| 110 | inodes return 0 rather than -1. Such systems should also return 0 for the total |
| 111 | number of inodes, so we require that to be greater than zero before returning |
| 112 | an inode count. |
| 113 | |
| 114 | Arguments: |
| 115 | isspool TRUE for spool partition, FALSE for log partition |
| 116 | inodeptr address of int to receive inode count; -1 if there isn't one |
| 117 | |
| 118 | Returns: available on-root space, in kilobytes |
| 119 | -1 for log partition if there isn't one |
| 120 | |
| 121 | All values are -1 if the STATFS functions are not available. |
| 122 | */ |
| 123 | |
| 124 | int |
| 125 | receive_statvfs(BOOL isspool, int *inodeptr) |
| 126 | { |
| 127 | #ifdef HAVE_STATFS |
| 128 | struct STATVFS statbuf; |
| 129 | uschar *path; |
| 130 | uschar *name; |
| 131 | uschar buffer[1024]; |
| 132 | |
| 133 | /* The spool directory must always exist. */ |
| 134 | |
| 135 | if (isspool) |
| 136 | { |
| 137 | path = spool_directory; |
| 138 | name = US"spool"; |
| 139 | } |
| 140 | |
| 141 | /* Need to cut down the log file path to the directory, and to ignore any |
| 142 | appearance of "syslog" in it. */ |
| 143 | |
| 144 | else |
| 145 | { |
| 146 | int sep = ':'; /* Not variable - outside scripts use */ |
| 147 | uschar *p = log_file_path; |
| 148 | name = US"log"; |
| 149 | |
| 150 | /* An empty log_file_path means "use the default". This is the same as an |
| 151 | empty item in a list. */ |
| 152 | |
| 153 | if (*p == 0) p = US":"; |
| 154 | while ((path = string_nextinlist(&p, &sep, buffer, sizeof(buffer))) != NULL) |
| 155 | { |
| 156 | if (Ustrcmp(path, "syslog") != 0) break; |
| 157 | } |
| 158 | |
| 159 | if (path == NULL) /* No log files */ |
| 160 | { |
| 161 | *inodeptr = -1; |
| 162 | return -1; |
| 163 | } |
| 164 | |
| 165 | /* An empty string means use the default, which is in the spool directory. |
| 166 | But don't just use the spool directory, as it is possible that the log |
| 167 | subdirectory has been symbolically linked elsewhere. */ |
| 168 | |
| 169 | if (path[0] == 0) |
| 170 | { |
| 171 | sprintf(CS buffer, CS"%s/log", CS spool_directory); |
| 172 | path = buffer; |
| 173 | } |
| 174 | else |
| 175 | { |
| 176 | uschar *cp; |
| 177 | if ((cp = Ustrrchr(path, '/')) != NULL) *cp = 0; |
| 178 | } |
| 179 | } |
| 180 | |
| 181 | /* We now have the patch; do the business */ |
| 182 | |
| 183 | memset(&statbuf, 0, sizeof(statbuf)); |
| 184 | |
| 185 | if (STATVFS(CS path, &statbuf) != 0) |
| 186 | { |
| 187 | log_write(0, LOG_MAIN|LOG_PANIC, "cannot accept message: failed to stat " |
| 188 | "%s directory %s: %s", name, spool_directory, strerror(errno)); |
| 189 | smtp_closedown(US"spool or log directory problem"); |
| 190 | exim_exit(EXIT_FAILURE); |
| 191 | } |
| 192 | |
| 193 | *inodeptr = (statbuf.F_FILES > 0)? statbuf.F_FAVAIL : -1; |
| 194 | |
| 195 | /* Disks are getting huge. Take care with computing the size in kilobytes. */ |
| 196 | |
| 197 | return (int)(((double)statbuf.F_BAVAIL * (double)statbuf.F_FRSIZE)/1024.0); |
| 198 | |
| 199 | /* Unable to find partition sizes in this environment. */ |
| 200 | |
| 201 | #else |
| 202 | *inodeptr = -1; |
| 203 | return -1; |
| 204 | #endif |
| 205 | } |
| 206 | |
| 207 | |
| 208 | |
| 209 | |
| 210 | /************************************************* |
| 211 | * Check space on spool and log partitions * |
| 212 | *************************************************/ |
| 213 | |
| 214 | /* This function is called before accepting a message; if any thresholds are |
| 215 | set, it checks them. If a message_size is supplied, it checks that there is |
| 216 | enough space for that size plus the threshold - i.e. that the message won't |
| 217 | reduce the space to the threshold. Not all OS have statvfs(); for those that |
| 218 | don't, this function always returns TRUE. For some OS the old function and |
| 219 | struct name statfs is used; that is handled by a macro, defined in exim.h. |
| 220 | |
| 221 | Arguments: |
| 222 | msg_size the (estimated) size of an incoming message |
| 223 | |
| 224 | Returns: FALSE if there isn't enough space, or if the information cannot |
| 225 | be obtained |
| 226 | TRUE if no check was done or there is enough space |
| 227 | */ |
| 228 | |
| 229 | BOOL |
| 230 | receive_check_fs(int msg_size) |
| 231 | { |
| 232 | int space, inodes; |
| 233 | |
| 234 | if (check_spool_space > 0 || msg_size > 0 || check_spool_inodes > 0) |
| 235 | { |
| 236 | space = receive_statvfs(TRUE, &inodes); |
| 237 | |
| 238 | DEBUG(D_receive) |
| 239 | debug_printf("spool directory space = %dK inodes = %d " |
| 240 | "check_space = %dK inodes = %d msg_size = %d\n", |
| 241 | space, inodes, check_spool_space, check_spool_inodes, msg_size); |
| 242 | |
| 243 | if ((space >= 0 && space < check_spool_space) || |
| 244 | (inodes >= 0 && inodes < check_spool_inodes)) |
| 245 | { |
| 246 | log_write(0, LOG_MAIN, "spool directory space check failed: space=%d " |
| 247 | "inodes=%d", space, inodes); |
| 248 | return FALSE; |
| 249 | } |
| 250 | } |
| 251 | |
| 252 | if (check_log_space > 0 || check_log_inodes > 0) |
| 253 | { |
| 254 | space = receive_statvfs(FALSE, &inodes); |
| 255 | |
| 256 | DEBUG(D_receive) |
| 257 | debug_printf("log directory space = %dK inodes = %d " |
| 258 | "check_space = %dK inodes = %d\n", |
| 259 | space, inodes, check_log_space, check_log_inodes); |
| 260 | |
| 261 | if ((space >= 0 && space < check_log_space) || |
| 262 | (inodes >= 0 && inodes < check_log_inodes)) |
| 263 | { |
| 264 | log_write(0, LOG_MAIN, "log directory space check failed: space=%d " |
| 265 | "inodes=%d", space, inodes); |
| 266 | return FALSE; |
| 267 | } |
| 268 | } |
| 269 | |
| 270 | return TRUE; |
| 271 | } |
| 272 | |
| 273 | |
| 274 | |
| 275 | /************************************************* |
| 276 | * Bomb out while reading a message * |
| 277 | *************************************************/ |
| 278 | |
| 279 | /* The common case of wanting to bomb out is if a SIGTERM or SIGINT is |
| 280 | received, or if there is a timeout. A rarer case might be if the log files are |
| 281 | screwed up and Exim can't open them to record a message's arrival. Handling |
| 282 | that case is done by setting a flag to cause the log functions to call this |
| 283 | function if there is an ultimate disaster. That is why it is globally |
| 284 | accessible. |
| 285 | |
| 286 | Arguments: SMTP response to give if in an SMTP session |
| 287 | Returns: it doesn't |
| 288 | */ |
| 289 | |
| 290 | void |
| 291 | receive_bomb_out(uschar *msg) |
| 292 | { |
| 293 | /* If spool_name is set, it contains the name of the data file that is being |
| 294 | written. Unlink it before closing so that it cannot be picked up by a delivery |
| 295 | process. Ensure that any header file is also removed. */ |
| 296 | |
| 297 | if (spool_name[0] != 0) |
| 298 | { |
| 299 | Uunlink(spool_name); |
| 300 | spool_name[Ustrlen(spool_name) - 1] = 'H'; |
| 301 | Uunlink(spool_name); |
| 302 | } |
| 303 | |
| 304 | /* Now close the file if it is open, either as a fd or a stream. */ |
| 305 | |
| 306 | if (data_file != NULL) (void)fclose(data_file); |
| 307 | else if (data_fd >= 0) (void)close(data_fd); |
| 308 | |
| 309 | /* Attempt to close down an SMTP connection tidily. */ |
| 310 | |
| 311 | if (smtp_input) |
| 312 | { |
| 313 | if (!smtp_batched_input) |
| 314 | { |
| 315 | smtp_printf("421 %s %s - closing connection.\r\n", smtp_active_hostname, |
| 316 | msg); |
| 317 | mac_smtp_fflush(); |
| 318 | } |
| 319 | |
| 320 | /* Control does not return from moan_smtp_batch(). */ |
| 321 | |
| 322 | else moan_smtp_batch(NULL, "421 %s - message abandoned", msg); |
| 323 | } |
| 324 | |
| 325 | /* Exit from the program (non-BSMTP cases) */ |
| 326 | |
| 327 | exim_exit(EXIT_FAILURE); |
| 328 | } |
| 329 | |
| 330 | |
| 331 | /************************************************* |
| 332 | * Data read timeout * |
| 333 | *************************************************/ |
| 334 | |
| 335 | /* Handler function for timeouts that occur while reading the data that |
| 336 | comprises a message. |
| 337 | |
| 338 | Argument: the signal number |
| 339 | Returns: nothing |
| 340 | */ |
| 341 | |
| 342 | static void |
| 343 | data_timeout_handler(int sig) |
| 344 | { |
| 345 | uschar *msg = NULL; |
| 346 | |
| 347 | sig = sig; /* Keep picky compilers happy */ |
| 348 | |
| 349 | if (smtp_input) |
| 350 | { |
| 351 | msg = US"SMTP incoming data timeout"; |
| 352 | log_write(L_lost_incoming_connection, |
| 353 | LOG_MAIN, "SMTP data timeout (message abandoned) on connection " |
| 354 | "from %s F=<%s>", |
| 355 | (sender_fullhost != NULL)? sender_fullhost : US"local process", |
| 356 | sender_address); |
| 357 | } |
| 358 | else |
| 359 | { |
| 360 | fprintf(stderr, "exim: timed out while reading - message abandoned\n"); |
| 361 | log_write(L_lost_incoming_connection, |
| 362 | LOG_MAIN, "timed out while reading local message"); |
| 363 | } |
| 364 | |
| 365 | receive_bomb_out(msg); /* Does not return */ |
| 366 | } |
| 367 | |
| 368 | |
| 369 | |
| 370 | /************************************************* |
| 371 | * local_scan() timeout * |
| 372 | *************************************************/ |
| 373 | |
| 374 | /* Handler function for timeouts that occur while running a local_scan() |
| 375 | function. |
| 376 | |
| 377 | Argument: the signal number |
| 378 | Returns: nothing |
| 379 | */ |
| 380 | |
| 381 | static void |
| 382 | local_scan_timeout_handler(int sig) |
| 383 | { |
| 384 | sig = sig; /* Keep picky compilers happy */ |
| 385 | log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function timed out - " |
| 386 | "message temporarily rejected (size %d)", message_size); |
| 387 | receive_bomb_out(US"local verification problem"); /* Does not return */ |
| 388 | } |
| 389 | |
| 390 | |
| 391 | |
| 392 | /************************************************* |
| 393 | * local_scan() crashed * |
| 394 | *************************************************/ |
| 395 | |
| 396 | /* Handler function for signals that occur while running a local_scan() |
| 397 | function. |
| 398 | |
| 399 | Argument: the signal number |
| 400 | Returns: nothing |
| 401 | */ |
| 402 | |
| 403 | static void |
| 404 | local_scan_crash_handler(int sig) |
| 405 | { |
| 406 | log_write(0, LOG_MAIN|LOG_REJECT, "local_scan() function crashed with " |
| 407 | "signal %d - message temporarily rejected (size %d)", sig, message_size); |
| 408 | receive_bomb_out(US"local verification problem"); /* Does not return */ |
| 409 | } |
| 410 | |
| 411 | |
| 412 | /************************************************* |
| 413 | * SIGTERM or SIGINT received * |
| 414 | *************************************************/ |
| 415 | |
| 416 | /* Handler for SIGTERM or SIGINT signals that occur while reading the |
| 417 | data that comprises a message. |
| 418 | |
| 419 | Argument: the signal number |
| 420 | Returns: nothing |
| 421 | */ |
| 422 | |
| 423 | static void |
| 424 | data_sigterm_sigint_handler(int sig) |
| 425 | { |
| 426 | uschar *msg = NULL; |
| 427 | |
| 428 | if (smtp_input) |
| 429 | { |
| 430 | msg = US"Service not available - SIGTERM or SIGINT received"; |
| 431 | log_write(0, LOG_MAIN, "%s closed after %s", smtp_get_connection_info(), |
| 432 | (sig == SIGTERM)? "SIGTERM" : "SIGINT"); |
| 433 | } |
| 434 | else |
| 435 | { |
| 436 | if (filter_test == FTEST_NONE) |
| 437 | { |
| 438 | fprintf(stderr, "\nexim: %s received - message abandoned\n", |
| 439 | (sig == SIGTERM)? "SIGTERM" : "SIGINT"); |
| 440 | log_write(0, LOG_MAIN, "%s received while reading local message", |
| 441 | (sig == SIGTERM)? "SIGTERM" : "SIGINT"); |
| 442 | } |
| 443 | } |
| 444 | |
| 445 | receive_bomb_out(msg); /* Does not return */ |
| 446 | } |
| 447 | |
| 448 | |
| 449 | |
| 450 | /************************************************* |
| 451 | * Add new recipient to list * |
| 452 | *************************************************/ |
| 453 | |
| 454 | /* This function builds a list of recipient addresses in argc/argv |
| 455 | format. |
| 456 | |
| 457 | Arguments: |
| 458 | recipient the next address to add to recipients_list |
| 459 | pno parent number for fixed aliases; -1 otherwise |
| 460 | |
| 461 | Returns: nothing |
| 462 | */ |
| 463 | |
| 464 | void |
| 465 | receive_add_recipient(uschar *recipient, int pno) |
| 466 | { |
| 467 | if (recipients_count >= recipients_list_max) |
| 468 | { |
| 469 | recipient_item *oldlist = recipients_list; |
| 470 | int oldmax = recipients_list_max; |
| 471 | recipients_list_max = recipients_list_max? 2*recipients_list_max : 50; |
| 472 | recipients_list = store_get(recipients_list_max * sizeof(recipient_item)); |
| 473 | if (oldlist != NULL) |
| 474 | memcpy(recipients_list, oldlist, oldmax * sizeof(recipient_item)); |
| 475 | } |
| 476 | |
| 477 | recipients_list[recipients_count].address = recipient; |
| 478 | recipients_list[recipients_count].pno = pno; |
| 479 | #ifdef EXPERIMENTAL_BRIGHTMAIL |
| 480 | recipients_list[recipients_count].bmi_optin = bmi_current_optin; |
| 481 | /* reset optin string pointer for next recipient */ |
| 482 | bmi_current_optin = NULL; |
| 483 | #endif |
| 484 | recipients_list[recipients_count++].errors_to = NULL; |
| 485 | } |
| 486 | |
| 487 | |
| 488 | |
| 489 | |
| 490 | /************************************************* |
| 491 | * Remove a recipient from the list * |
| 492 | *************************************************/ |
| 493 | |
| 494 | /* This function is provided for local_scan() to use. |
| 495 | |
| 496 | Argument: |
| 497 | recipient address to remove |
| 498 | |
| 499 | Returns: TRUE if it did remove something; FALSE otherwise |
| 500 | */ |
| 501 | |
| 502 | BOOL |
| 503 | receive_remove_recipient(uschar *recipient) |
| 504 | { |
| 505 | int count; |
| 506 | DEBUG(D_receive) debug_printf("receive_remove_recipient(\"%s\") called\n", |
| 507 | recipient); |
| 508 | for (count = 0; count < recipients_count; count++) |
| 509 | { |
| 510 | if (Ustrcmp(recipients_list[count].address, recipient) == 0) |
| 511 | { |
| 512 | if ((--recipients_count - count) > 0) |
| 513 | memmove(recipients_list + count, recipients_list + count + 1, |
| 514 | (recipients_count - count)*sizeof(recipient_item)); |
| 515 | return TRUE; |
| 516 | } |
| 517 | } |
| 518 | return FALSE; |
| 519 | } |
| 520 | |
| 521 | |
| 522 | |
| 523 | |
| 524 | |
| 525 | /************************************************* |
| 526 | * Read data portion of a non-SMTP message * |
| 527 | *************************************************/ |
| 528 | |
| 529 | /* This function is called to read the remainder of a message (following the |
| 530 | header) when the input is not from SMTP - we are receiving a local message on |
| 531 | a standard input stream. The message is always terminated by EOF, and is also |
| 532 | terminated by a dot on a line by itself if the flag dot_ends is TRUE. Split the |
| 533 | two cases for maximum efficiency. |
| 534 | |
| 535 | Ensure that the body ends with a newline. This will naturally be the case when |
| 536 | the termination is "\n.\n" but may not be otherwise. The RFC defines messages |
| 537 | as "sequences of lines" - this of course strictly applies only to SMTP, but |
| 538 | deliveries into BSD-type mailbox files also require it. Exim used to have a |
| 539 | flag for doing this at delivery time, but as it was always set for all |
| 540 | transports, I decided to simplify things by putting the check here instead. |
| 541 | |
| 542 | There is at least one MUA (dtmail) that sends CRLF via this interface, and |
| 543 | other programs are known to do this as well. Exim used to have a option for |
| 544 | dealing with this: in July 2003, after much discussion, the code has been |
| 545 | changed to default to treat any of LF, CRLF, and bare CR as line terminators. |
| 546 | |
| 547 | However, for the case when a dot on a line by itself terminates a message, the |
| 548 | only recognized terminating sequences before and after the dot are LF and CRLF. |
| 549 | Otherwise, having read EOL . CR, you don't know whether to read another |
| 550 | character or not. |
| 551 | |
| 552 | Internally, in messages stored in Exim's spool files, LF is used as the line |
| 553 | terminator. Under the new regime, bare CRs will no longer appear in these |
| 554 | files. |
| 555 | |
| 556 | Arguments: |
| 557 | fout a FILE to which to write the message |
| 558 | |
| 559 | Returns: One of the END_xxx values indicating why it stopped reading |
| 560 | */ |
| 561 | |
| 562 | static int |
| 563 | read_message_data(FILE *fout) |
| 564 | { |
| 565 | int ch_state; |
| 566 | register int ch; |
| 567 | |
| 568 | /* Handle the case when only EOF terminates the message */ |
| 569 | |
| 570 | if (!dot_ends) |
| 571 | { |
| 572 | register int last_ch = '\n'; |
| 573 | |
| 574 | for (; (ch = (RECEIVE_GETC)()) != EOF; last_ch = ch) |
| 575 | { |
| 576 | if (ch == 0) body_zerocount++; |
| 577 | if (last_ch == '\r' && ch != '\n') |
| 578 | { |
| 579 | if (fputc('\n', fout) == EOF) return END_WERROR; |
| 580 | message_size++; |
| 581 | body_linecount++; |
| 582 | } |
| 583 | if (ch == '\r') continue; |
| 584 | |
| 585 | if (fputc(ch, fout) == EOF) return END_WERROR; |
| 586 | if (ch == '\n') body_linecount++; |
| 587 | if (++message_size > thismessage_size_limit) return END_SIZE; |
| 588 | } |
| 589 | |
| 590 | if (last_ch != '\n') |
| 591 | { |
| 592 | if (fputc('\n', fout) == EOF) return END_WERROR; |
| 593 | message_size++; |
| 594 | body_linecount++; |
| 595 | } |
| 596 | |
| 597 | return END_EOF; |
| 598 | } |
| 599 | |
| 600 | /* Handle the case when a dot on a line on its own, or EOF, terminates. */ |
| 601 | |
| 602 | ch_state = 1; |
| 603 | |
| 604 | while ((ch = (RECEIVE_GETC)()) != EOF) |
| 605 | { |
| 606 | if (ch == 0) body_zerocount++; |
| 607 | switch (ch_state) |
| 608 | { |
| 609 | case 0: /* Normal state (previous char written) */ |
| 610 | if (ch == '\n') |
| 611 | { body_linecount++; ch_state = 1; } |
| 612 | else if (ch == '\r') |
| 613 | { ch_state = 2; continue; } |
| 614 | break; |
| 615 | |
| 616 | case 1: /* After written "\n" */ |
| 617 | if (ch == '.') { ch_state = 3; continue; } |
| 618 | if (ch != '\n') ch_state = 0; |
| 619 | break; |
| 620 | |
| 621 | case 2: |
| 622 | body_linecount++; /* After unwritten "\r" */ |
| 623 | if (ch == '\n') |
| 624 | { ch_state = 1; } |
| 625 | else |
| 626 | { |
| 627 | if (message_size++, fputc('\n', fout) == EOF) return END_WERROR; |
| 628 | if (ch == '\r') continue; |
| 629 | ch_state = 0; |
| 630 | } |
| 631 | break; |
| 632 | |
| 633 | case 3: /* After "\n." (\n written, dot not) */ |
| 634 | if (ch == '\n') return END_DOT; |
| 635 | if (ch == '\r') { ch_state = 4; continue; } |
| 636 | message_size++; |
| 637 | if (fputc('.', fout) == EOF) return END_WERROR; |
| 638 | ch_state = 0; |
| 639 | break; |
| 640 | |
| 641 | case 4: /* After "\n.\r" (\n written, rest not) */ |
| 642 | if (ch == '\n') return END_DOT; |
| 643 | message_size += 2; |
| 644 | body_linecount++; |
| 645 | if (fputs(".\n", fout) == EOF) return END_WERROR; |
| 646 | if (ch == '\r') { ch_state = 2; continue; } |
| 647 | ch_state = 0; |
| 648 | break; |
| 649 | } |
| 650 | |
| 651 | if (fputc(ch, fout) == EOF) return END_WERROR; |
| 652 | if (++message_size > thismessage_size_limit) return END_SIZE; |
| 653 | } |
| 654 | |
| 655 | /* Get here if EOF read. Unless we have just written "\n", we need to ensure |
| 656 | the message ends with a newline, and we must also write any characters that |
| 657 | were saved up while testing for an ending dot. */ |
| 658 | |
| 659 | if (ch_state != 1) |
| 660 | { |
| 661 | static uschar *ends[] = { US"\n", NULL, US"\n", US".\n", US".\n" }; |
| 662 | if (fputs(CS ends[ch_state], fout) == EOF) return END_WERROR; |
| 663 | message_size += Ustrlen(ends[ch_state]); |
| 664 | body_linecount++; |
| 665 | } |
| 666 | |
| 667 | return END_EOF; |
| 668 | } |
| 669 | |
| 670 | |
| 671 | |
| 672 | |
| 673 | /************************************************* |
| 674 | * Read data portion of an SMTP message * |
| 675 | *************************************************/ |
| 676 | |
| 677 | /* This function is called to read the remainder of an SMTP message (after the |
| 678 | headers), or to skip over it when an error has occurred. In this case, the |
| 679 | output file is passed as NULL. |
| 680 | |
| 681 | If any line begins with a dot, that character is skipped. The input should only |
| 682 | be successfully terminated by CR LF . CR LF unless it is local (non-network) |
| 683 | SMTP, in which case the CRs are optional, but... |
| 684 | |
| 685 | FUDGE: It seems that sites on the net send out messages with just LF |
| 686 | terminators, despite the warnings in the RFCs, and other MTAs handle this. So |
| 687 | we make the CRs optional in all cases. |
| 688 | |
| 689 | July 2003: Bare CRs cause trouble. We now treat them as line terminators as |
| 690 | well, so that there are no CRs in spooled messages. However, the message |
| 691 | terminating dot is not recognized between two bare CRs. |
| 692 | |
| 693 | Arguments: |
| 694 | fout a FILE to which to write the message; NULL if skipping |
| 695 | |
| 696 | Returns: One of the END_xxx values indicating why it stopped reading |
| 697 | */ |
| 698 | |
| 699 | static int |
| 700 | read_message_data_smtp(FILE *fout) |
| 701 | { |
| 702 | int ch_state = 0; |
| 703 | register int ch; |
| 704 | |
| 705 | while ((ch = (RECEIVE_GETC)()) != EOF) |
| 706 | { |
| 707 | if (ch == 0) body_zerocount++; |
| 708 | switch (ch_state) |
| 709 | { |
| 710 | case 0: /* After LF or CRLF */ |
| 711 | if (ch == '.') |
| 712 | { |
| 713 | ch_state = 3; |
| 714 | continue; /* Don't ever write . after LF */ |
| 715 | } |
| 716 | ch_state = 1; |
| 717 | |
| 718 | /* Else fall through to handle as normal uschar. */ |
| 719 | |
| 720 | case 1: /* Normal state */ |
| 721 | if (ch == '\n') |
| 722 | { |
| 723 | ch_state = 0; |
| 724 | body_linecount++; |
| 725 | } |
| 726 | else if (ch == '\r') |
| 727 | { |
| 728 | ch_state = 2; |
| 729 | continue; |
| 730 | } |
| 731 | break; |
| 732 | |
| 733 | case 2: /* After (unwritten) CR */ |
| 734 | body_linecount++; |
| 735 | if (ch == '\n') |
| 736 | { |
| 737 | ch_state = 0; |
| 738 | } |
| 739 | else |
| 740 | { |
| 741 | message_size++; |
| 742 | if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR; |
| 743 | if (ch != '\r') ch_state = 1; else continue; |
| 744 | } |
| 745 | break; |
| 746 | |
| 747 | case 3: /* After [CR] LF . */ |
| 748 | if (ch == '\n') |
| 749 | return END_DOT; |
| 750 | if (ch == '\r') |
| 751 | { |
| 752 | ch_state = 4; |
| 753 | continue; |
| 754 | } |
| 755 | ch_state = 1; /* The dot itself is removed */ |
| 756 | break; |
| 757 | |
| 758 | case 4: /* After [CR] LF . CR */ |
| 759 | if (ch == '\n') return END_DOT; |
| 760 | message_size++; |
| 761 | body_linecount++; |
| 762 | if (fout != NULL && fputc('\n', fout) == EOF) return END_WERROR; |
| 763 | if (ch == '\r') |
| 764 | { |
| 765 | ch_state = 2; |
| 766 | continue; |
| 767 | } |
| 768 | ch_state = 1; |
| 769 | break; |
| 770 | } |
| 771 | |
| 772 | /* Add the character to the spool file, unless skipping; then loop for the |
| 773 | next. */ |
| 774 | |
| 775 | message_size++; |
| 776 | if (fout != NULL) |
| 777 | { |
| 778 | if (fputc(ch, fout) == EOF) return END_WERROR; |
| 779 | if (message_size > thismessage_size_limit) return END_SIZE; |
| 780 | } |
| 781 | } |
| 782 | |
| 783 | /* Fall through here if EOF encountered. This indicates some kind of error, |
| 784 | since a correct message is terminated by [CR] LF . [CR] LF. */ |
| 785 | |
| 786 | return END_EOF; |
| 787 | } |
| 788 | |
| 789 | |
| 790 | |
| 791 | |
| 792 | /************************************************* |
| 793 | * Swallow SMTP message * |
| 794 | *************************************************/ |
| 795 | |
| 796 | /* This function is called when there has been some kind of error while reading |
| 797 | an SMTP message, and the remaining data may need to be swallowed. It is global |
| 798 | because it is called from smtp_closedown() to shut down an incoming call |
| 799 | tidily. |
| 800 | |
| 801 | Argument: a FILE from which to read the message |
| 802 | Returns: nothing |
| 803 | */ |
| 804 | |
| 805 | void |
| 806 | receive_swallow_smtp(void) |
| 807 | { |
| 808 | if (message_ended >= END_NOTENDED) |
| 809 | message_ended = read_message_data_smtp(NULL); |
| 810 | } |
| 811 | |
| 812 | |
| 813 | |
| 814 | /************************************************* |
| 815 | * Handle lost SMTP connection * |
| 816 | *************************************************/ |
| 817 | |
| 818 | /* This function logs connection loss incidents and generates an appropriate |
| 819 | SMTP response. |
| 820 | |
| 821 | Argument: additional data for the message |
| 822 | Returns: the SMTP response |
| 823 | */ |
| 824 | |
| 825 | static uschar * |
| 826 | handle_lost_connection(uschar *s) |
| 827 | { |
| 828 | log_write(L_lost_incoming_connection | L_smtp_connection, LOG_MAIN, |
| 829 | "%s lost while reading message data%s", smtp_get_connection_info(), s); |
| 830 | return US"421 Lost incoming connection"; |
| 831 | } |
| 832 | |
| 833 | |
| 834 | |
| 835 | |
| 836 | /************************************************* |
| 837 | * Handle a non-smtp reception error * |
| 838 | *************************************************/ |
| 839 | |
| 840 | /* This function is called for various errors during the reception of non-SMTP |
| 841 | messages. It either sends a message to the sender of the problem message, or it |
| 842 | writes to the standard error stream. |
| 843 | |
| 844 | Arguments: |
| 845 | errcode code for moan_to_sender(), identifying the error |
| 846 | text1 first message text, passed to moan_to_sender() |
| 847 | text2 second message text, used only for stderrr |
| 848 | error_rc code to pass to exim_exit if no problem |
| 849 | f FILE containing body of message (may be stdin) |
| 850 | hptr pointer to instore headers or NULL |
| 851 | |
| 852 | Returns: calls exim_exit(), which does not return |
| 853 | */ |
| 854 | |
| 855 | static void |
| 856 | give_local_error(int errcode, uschar *text1, uschar *text2, int error_rc, |
| 857 | FILE *f, header_line *hptr) |
| 858 | { |
| 859 | if (error_handling == ERRORS_SENDER) |
| 860 | { |
| 861 | error_block eblock; |
| 862 | eblock.next = NULL; |
| 863 | eblock.text1 = text1; |
| 864 | if (!moan_to_sender(errcode, &eblock, hptr, f, FALSE)) |
| 865 | error_rc = EXIT_FAILURE; |
| 866 | } |
| 867 | else fprintf(stderr, "exim: %s%s\n", text2, text1); /* Sic */ |
| 868 | (void)fclose(f); |
| 869 | exim_exit(error_rc); |
| 870 | } |
| 871 | |
| 872 | |
| 873 | |
| 874 | /************************************************* |
| 875 | * Add header lines set up by ACL * |
| 876 | *************************************************/ |
| 877 | |
| 878 | /* This function is called to add the header lines that were set up by "warn" |
| 879 | statements in an ACL onto the list of headers in memory. It is done in two |
| 880 | stages like this, because when the ACL for RCPT is running, the other headers |
| 881 | have not yet been received. This function is called twice; once just before |
| 882 | running the DATA ACL, and once after. This is so that header lines added by |
| 883 | MAIL or RCPT are visible to the DATA ACL. |
| 884 | |
| 885 | Originally these header lines were added at the end. Now there is support for |
| 886 | three different places: top, bottom, and after the Received: header(s). There |
| 887 | will always be at least one Received: header, even if it is marked deleted, and |
| 888 | even if something else has been put in front of it. |
| 889 | |
| 890 | Arguments: |
| 891 | acl_name text to identify which ACL |
| 892 | |
| 893 | Returns: nothing |
| 894 | */ |
| 895 | |
| 896 | static void |
| 897 | add_acl_headers(uschar *acl_name) |
| 898 | { |
| 899 | header_line *h, *next; |
| 900 | header_line *last_received = NULL; |
| 901 | |
| 902 | if (acl_warn_headers == NULL) return; |
| 903 | DEBUG(D_receive|D_acl) debug_printf(">>Headers added by %s ACL:\n", acl_name); |
| 904 | |
| 905 | for (h = acl_warn_headers; h != NULL; h = next) |
| 906 | { |
| 907 | next = h->next; |
| 908 | |
| 909 | switch(h->type) |
| 910 | { |
| 911 | case htype_add_top: |
| 912 | h->next = header_list; |
| 913 | header_list = h; |
| 914 | DEBUG(D_receive|D_acl) debug_printf(" (at top)"); |
| 915 | break; |
| 916 | |
| 917 | case htype_add_rec: |
| 918 | if (last_received == NULL) |
| 919 | { |
| 920 | last_received = header_list; |
| 921 | while (!header_testname(last_received, US"Received", 8, FALSE)) |
| 922 | last_received = last_received->next; |
| 923 | while (last_received->next != NULL && |
| 924 | header_testname(last_received->next, US"Received", 8, FALSE)) |
| 925 | last_received = last_received->next; |
| 926 | } |
| 927 | h->next = last_received->next; |
| 928 | last_received->next = h; |
| 929 | DEBUG(D_receive|D_acl) debug_printf(" (after Received:)"); |
| 930 | break; |
| 931 | |
| 932 | case htype_add_rfc: |
| 933 | /* add header before any header which is NOT Received: or Resent- */ |
| 934 | last_received = header_list; |
| 935 | while ( (last_received->next != NULL) && |
| 936 | ( (header_testname(last_received->next, US"Received", 8, FALSE)) || |
| 937 | (header_testname_incomplete(last_received->next, US"Resent-", 7, FALSE)) ) ) |
| 938 | last_received = last_received->next; |
| 939 | /* last_received now points to the last Received: or Resent-* header |
| 940 | in an uninterrupted chain of those header types (seen from the beginning |
| 941 | of all headers. Our current header must follow it. */ |
| 942 | h->next = last_received->next; |
| 943 | last_received->next = h; |
| 944 | DEBUG(D_receive|D_acl) debug_printf(" (before any non-Received: or Resent-*: header)"); |
| 945 | break; |
| 946 | |
| 947 | default: |
| 948 | h->next = NULL; |
| 949 | header_last->next = h; |
| 950 | break; |
| 951 | } |
| 952 | |
| 953 | if (h->next == NULL) header_last = h; |
| 954 | |
| 955 | /* Check for one of the known header types (From:, To:, etc.) though in |
| 956 | practice most added headers are going to be "other". Lower case |
| 957 | identification letters are never stored with the header; they are used |
| 958 | for existence tests when messages are received. So discard any lower case |
| 959 | flag values. */ |
| 960 | |
| 961 | h->type = header_checkname(h, FALSE); |
| 962 | if (h->type >= 'a') h->type = htype_other; |
| 963 | |
| 964 | DEBUG(D_receive|D_acl) debug_printf(" %s", header_last->text); |
| 965 | } |
| 966 | |
| 967 | acl_warn_headers = NULL; |
| 968 | DEBUG(D_receive|D_acl) debug_printf(">>\n"); |
| 969 | } |
| 970 | |
| 971 | |
| 972 | |
| 973 | /************************************************* |
| 974 | * Add host information for log line * |
| 975 | *************************************************/ |
| 976 | |
| 977 | /* Called for acceptance and rejecting log lines. This adds information about |
| 978 | the calling host to a string that is being built dynamically. |
| 979 | |
| 980 | Arguments: |
| 981 | s the dynamic string |
| 982 | sizeptr points to the size variable |
| 983 | ptrptr points to the pointer variable |
| 984 | |
| 985 | Returns: the extended string |
| 986 | */ |
| 987 | |
| 988 | static uschar * |
| 989 | add_host_info_for_log(uschar *s, int *sizeptr, int *ptrptr) |
| 990 | { |
| 991 | if (sender_fullhost != NULL) |
| 992 | { |
| 993 | s = string_append(s, sizeptr, ptrptr, 2, US" H=", sender_fullhost); |
| 994 | if ((log_extra_selector & LX_incoming_interface) != 0 && |
| 995 | interface_address != NULL) |
| 996 | { |
| 997 | uschar *ss = string_sprintf(" I=[%s]:%d", interface_address, |
| 998 | interface_port); |
| 999 | s = string_cat(s, sizeptr, ptrptr, ss, Ustrlen(ss)); |
| 1000 | } |
| 1001 | } |
| 1002 | if (sender_ident != NULL) |
| 1003 | s = string_append(s, sizeptr, ptrptr, 2, US" U=", sender_ident); |
| 1004 | if (received_protocol != NULL) |
| 1005 | s = string_append(s, sizeptr, ptrptr, 2, US" P=", received_protocol); |
| 1006 | return s; |
| 1007 | } |
| 1008 | |
| 1009 | |
| 1010 | |
| 1011 | #ifdef WITH_CONTENT_SCAN |
| 1012 | |
| 1013 | /************************************************* |
| 1014 | * Run the MIME ACL on a message * |
| 1015 | *************************************************/ |
| 1016 | |
| 1017 | /* This code is in a subroutine so that it can be used for both SMTP |
| 1018 | and non-SMTP messages. It is called with a non-NULL ACL pointer. |
| 1019 | |
| 1020 | Arguments: |
| 1021 | acl The ACL to run (acl_smtp_mime or acl_not_smtp_mime) |
| 1022 | smtp_yield_ptr Set FALSE to kill messages after dropped connection |
| 1023 | smtp_reply_ptr Where SMTP reply is being built |
| 1024 | blackholed_by_ptr Where "blackholed by" message is being built |
| 1025 | |
| 1026 | Returns: TRUE to carry on; FALSE to abandon the message |
| 1027 | */ |
| 1028 | |
| 1029 | static BOOL |
| 1030 | run_mime_acl(uschar *acl, BOOL *smtp_yield_ptr, uschar **smtp_reply_ptr, |
| 1031 | uschar **blackholed_by_ptr) |
| 1032 | { |
| 1033 | FILE *mbox_file; |
| 1034 | uschar rfc822_file_path[2048]; |
| 1035 | unsigned long mbox_size; |
| 1036 | header_line *my_headerlist; |
| 1037 | uschar *user_msg, *log_msg; |
| 1038 | int mime_part_count_buffer = -1; |
| 1039 | int rc; |
| 1040 | |
| 1041 | memset(CS rfc822_file_path,0,2048); |
| 1042 | |
| 1043 | /* check if it is a MIME message */ |
| 1044 | my_headerlist = header_list; |
| 1045 | while (my_headerlist != NULL) { |
| 1046 | /* skip deleted headers */ |
| 1047 | if (my_headerlist->type == '*') { |
| 1048 | my_headerlist = my_headerlist->next; |
| 1049 | continue; |
| 1050 | }; |
| 1051 | if (strncmpic(my_headerlist->text, US"Content-Type:", 13) == 0) { |
| 1052 | DEBUG(D_receive) debug_printf("Found Content-Type: header - executing acl_smtp_mime.\n"); |
| 1053 | goto DO_MIME_ACL; |
| 1054 | }; |
| 1055 | my_headerlist = my_headerlist->next; |
| 1056 | }; |
| 1057 | |
| 1058 | DEBUG(D_receive) debug_printf("No Content-Type: header - presumably not a MIME message.\n"); |
| 1059 | return TRUE; |
| 1060 | |
| 1061 | DO_MIME_ACL: |
| 1062 | /* make sure the eml mbox file is spooled up */ |
| 1063 | mbox_file = spool_mbox(&mbox_size); |
| 1064 | if (mbox_file == NULL) { |
| 1065 | /* error while spooling */ |
| 1066 | log_write(0, LOG_MAIN|LOG_PANIC, |
| 1067 | "acl_smtp_mime: error while creating mbox spool file, message temporarily rejected."); |
| 1068 | Uunlink(spool_name); |
| 1069 | unspool_mbox(); |
| 1070 | smtp_respond(451, TRUE, US"temporary local problem"); |
| 1071 | message_id[0] = 0; /* Indicate no message accepted */ |
| 1072 | *smtp_reply_ptr = US""; /* Indicate reply already sent */ |
| 1073 | return FALSE; /* Indicate skip to end of receive function */ |
| 1074 | }; |
| 1075 | |
| 1076 | mime_is_rfc822 = 0; |
| 1077 | |
| 1078 | MIME_ACL_CHECK: |
| 1079 | mime_part_count = -1; |
| 1080 | rc = mime_acl_check(acl, mbox_file, NULL, &user_msg, &log_msg); |
| 1081 | (void)fclose(mbox_file); |
| 1082 | |
| 1083 | if (Ustrlen(rfc822_file_path) > 0) { |
| 1084 | mime_part_count = mime_part_count_buffer; |
| 1085 | |
| 1086 | if (unlink(CS rfc822_file_path) == -1) { |
| 1087 | log_write(0, LOG_PANIC, |
| 1088 | "acl_smtp_mime: can't unlink RFC822 spool file, skipping."); |
| 1089 | goto END_MIME_ACL; |
| 1090 | }; |
| 1091 | }; |
| 1092 | |
| 1093 | /* check if we must check any message/rfc822 attachments */ |
| 1094 | if (rc == OK) { |
| 1095 | uschar temp_path[1024]; |
| 1096 | int n; |
| 1097 | struct dirent *entry; |
| 1098 | DIR *tempdir; |
| 1099 | |
| 1100 | snprintf(CS temp_path, 1024, "%s/scan/%s", spool_directory, message_id); |
| 1101 | |
| 1102 | tempdir = opendir(CS temp_path); |
| 1103 | n = 0; |
| 1104 | do { |
| 1105 | entry = readdir(tempdir); |
| 1106 | if (entry == NULL) break; |
| 1107 | if (strncmpic(US entry->d_name,US"__rfc822_",9) == 0) { |
| 1108 | snprintf(CS rfc822_file_path, 2048,"%s/scan/%s/%s", spool_directory, message_id, entry->d_name); |
| 1109 | debug_printf("RFC822 attachment detected: running MIME ACL for '%s'\n", rfc822_file_path); |
| 1110 | break; |
| 1111 | }; |
| 1112 | } while (1); |
| 1113 | closedir(tempdir); |
| 1114 | |
| 1115 | if (entry != NULL) { |
| 1116 | mbox_file = Ufopen(rfc822_file_path,"r"); |
| 1117 | if (mbox_file == NULL) { |
| 1118 | log_write(0, LOG_PANIC, |
| 1119 | "acl_smtp_mime: can't open RFC822 spool file, skipping."); |
| 1120 | unlink(CS rfc822_file_path); |
| 1121 | goto END_MIME_ACL; |
| 1122 | }; |
| 1123 | /* set RFC822 expansion variable */ |
| 1124 | mime_is_rfc822 = 1; |
| 1125 | mime_part_count_buffer = mime_part_count; |
| 1126 | goto MIME_ACL_CHECK; |
| 1127 | }; |
| 1128 | }; |
| 1129 | |
| 1130 | END_MIME_ACL: |
| 1131 | add_acl_headers(US"MIME"); |
| 1132 | if (rc == DISCARD) |
| 1133 | { |
| 1134 | recipients_count = 0; |
| 1135 | *blackholed_by_ptr = US"MIME ACL"; |
| 1136 | } |
| 1137 | else if (rc != OK) |
| 1138 | { |
| 1139 | Uunlink(spool_name); |
| 1140 | unspool_mbox(); |
| 1141 | if (smtp_handle_acl_fail(ACL_WHERE_MIME, rc, user_msg, log_msg) != 0) |
| 1142 | *smtp_yield_ptr = FALSE; /* No more messsages after dropped connection */ |
| 1143 | *smtp_reply_ptr = US""; /* Indicate reply already sent */ |
| 1144 | message_id[0] = 0; /* Indicate no message accepted */ |
| 1145 | return FALSE; /* Cause skip to end of receive function */ |
| 1146 | }; |
| 1147 | |
| 1148 | return TRUE; |
| 1149 | } |
| 1150 | |
| 1151 | #endif /* WITH_CONTENT_SCAN */ |
| 1152 | |
| 1153 | |
| 1154 | /************************************************* |
| 1155 | * Receive message * |
| 1156 | *************************************************/ |
| 1157 | |
| 1158 | /* Receive a message on the given input, and put it into a pair of spool files. |
| 1159 | Either a non-null list of recipients, or the extract flag will be true, or |
| 1160 | both. The flag sender_local is true for locally generated messages. The flag |
| 1161 | submission_mode is true if an ACL has obeyed "control = submission". The flag |
| 1162 | smtp_input is true if the message is to be handled using SMTP conventions about |
| 1163 | termination and lines starting with dots. For non-SMTP messages, dot_ends is |
| 1164 | true for dot-terminated messages. |
| 1165 | |
| 1166 | If a message was successfully read, message_id[0] will be non-zero. |
| 1167 | |
| 1168 | The general actions of this function are: |
| 1169 | |
| 1170 | . Read the headers of the message (if any) into a chain of store |
| 1171 | blocks. |
| 1172 | |
| 1173 | . If there is a "sender:" header and the message is locally originated, |
| 1174 | throw it away, unless the caller is trusted, or unless |
| 1175 | active_local_sender_retain is set - which can only happen if |
| 1176 | active_local_from_check is false. |
| 1177 | |
| 1178 | . If recipients are to be extracted from the message, build the |
| 1179 | recipients list from the headers, removing any that were on the |
| 1180 | original recipients list (unless extract_addresses_remove_arguments is |
| 1181 | false), and at the same time, remove any bcc header that may be present. |
| 1182 | |
| 1183 | . Get the spool file for the data, sort out its unique name, open |
| 1184 | and lock it (but don't give it the name yet). |
| 1185 | |
| 1186 | . Generate a "Message-Id" header if the message doesn't have one, for |
| 1187 | locally-originated messages. |
| 1188 | |
| 1189 | . Generate a "Received" header. |
| 1190 | |
| 1191 | . Ensure the recipients list is fully qualified and rewritten if necessary. |
| 1192 | |
| 1193 | . If there are any rewriting rules, apply them to the sender address |
| 1194 | and also to the headers. |
| 1195 | |
| 1196 | . If there is no from: header, generate one, for locally-generated messages |
| 1197 | and messages in "submission mode" only. |
| 1198 | |
| 1199 | . If the sender is local, check that from: is correct, and if not, generate |
| 1200 | a Sender: header, unless message comes from a trusted caller, or this |
| 1201 | feature is disabled by active_local_from_check being false. |
| 1202 | |
| 1203 | . If there is no "date" header, generate one, for locally-originated |
| 1204 | or submission mode messages only. |
| 1205 | |
| 1206 | . Copy the rest of the input, or up to a terminating "." if in SMTP or |
| 1207 | dot_ends mode, to the data file. Leave it open, to hold the lock. |
| 1208 | |
| 1209 | . Write the envelope and the headers to a new file. |
| 1210 | |
| 1211 | . Set the name for the header file; close it. |
| 1212 | |
| 1213 | . Set the name for the data file; close it. |
| 1214 | |
| 1215 | Because this function can potentially be called many times in a single |
| 1216 | SMTP connection, all store should be got by store_get(), so that it will be |
| 1217 | automatically retrieved after the message is accepted. |
| 1218 | |
| 1219 | FUDGE: It seems that sites on the net send out messages with just LF |
| 1220 | terminators, despite the warnings in the RFCs, and other MTAs handle this. So |
| 1221 | we make the CRs optional in all cases. |
| 1222 | |
| 1223 | July 2003: Bare CRs in messages, especially in header lines, cause trouble. A |
| 1224 | new regime is now in place in which bare CRs in header lines are turned into LF |
| 1225 | followed by a space, so as not to terminate the header line. |
| 1226 | |
| 1227 | February 2004: A bare LF in a header line in a message whose first line was |
| 1228 | terminated by CRLF is treated in the same way as a bare CR. |
| 1229 | |
| 1230 | Arguments: |
| 1231 | extract_recip TRUE if recipients are to be extracted from the message's |
| 1232 | headers |
| 1233 | |
| 1234 | Returns: TRUE there are more messages to be read (SMTP input) |
| 1235 | FALSE there are no more messages to be read (non-SMTP input |
| 1236 | or SMTP connection collapsed, or other failure) |
| 1237 | |
| 1238 | When reading a message for filter testing, the returned value indicates |
| 1239 | whether the headers (which is all that is read) were terminated by '.' or |
| 1240 | not. */ |
| 1241 | |
| 1242 | BOOL |
| 1243 | receive_msg(BOOL extract_recip) |
| 1244 | { |
| 1245 | int i, rc; |
| 1246 | int msg_size = 0; |
| 1247 | int process_info_len = Ustrlen(process_info); |
| 1248 | int error_rc = (error_handling == ERRORS_SENDER)? |
| 1249 | errors_sender_rc : EXIT_FAILURE; |
| 1250 | int header_size = 256; |
| 1251 | int start, end, domain, size, sptr; |
| 1252 | int id_resolution; |
| 1253 | int had_zero = 0; |
| 1254 | |
| 1255 | register int ptr = 0; |
| 1256 | |
| 1257 | BOOL contains_resent_headers = FALSE; |
| 1258 | BOOL extracted_ignored = FALSE; |
| 1259 | BOOL first_line_ended_crlf = TRUE_UNSET; |
| 1260 | BOOL smtp_yield = TRUE; |
| 1261 | BOOL yield = FALSE; |
| 1262 | |
| 1263 | BOOL resents_exist = FALSE; |
| 1264 | uschar *resent_prefix = US""; |
| 1265 | uschar *blackholed_by = NULL; |
| 1266 | uschar *blackhole_log_msg = US""; |
| 1267 | |
| 1268 | flock_t lock_data; |
| 1269 | error_block *bad_addresses = NULL; |
| 1270 | |
| 1271 | uschar *frozen_by = NULL; |
| 1272 | uschar *queued_by = NULL; |
| 1273 | |
| 1274 | uschar *errmsg, *s; |
| 1275 | struct stat statbuf; |
| 1276 | |
| 1277 | /* Final message to give to SMTP caller */ |
| 1278 | |
| 1279 | uschar *smtp_reply = NULL; |
| 1280 | |
| 1281 | /* Working header pointers */ |
| 1282 | |
| 1283 | header_line *h, *next; |
| 1284 | |
| 1285 | /* Flags for noting the existence of certain headers */ |
| 1286 | |
| 1287 | /**** No longer check for these (Nov 2003) |
| 1288 | BOOL to_or_cc_header_exists = FALSE; |
| 1289 | BOOL bcc_header_exists = FALSE; |
| 1290 | ****/ |
| 1291 | |
| 1292 | BOOL date_header_exists = FALSE; |
| 1293 | |
| 1294 | /* Pointers to receive the addresses of headers whose contents we need. */ |
| 1295 | |
| 1296 | header_line *from_header = NULL; |
| 1297 | header_line *subject_header = NULL; |
| 1298 | header_line *msgid_header = NULL; |
| 1299 | header_line *received_header; |
| 1300 | |
| 1301 | /* Variables for use when building the Received: header. */ |
| 1302 | |
| 1303 | uschar *received; |
| 1304 | uschar *timestamp; |
| 1305 | int tslen; |
| 1306 | |
| 1307 | /* Release any open files that might have been cached while preparing to |
| 1308 | accept the message - e.g. by verifying addresses - because reading a message |
| 1309 | might take a fair bit of real time. */ |
| 1310 | |
| 1311 | search_tidyup(); |
| 1312 | |
| 1313 | /* Initialize the chain of headers by setting up a place-holder for Received: |
| 1314 | header. Temporarily mark it as "old", i.e. not to be used. We keep header_last |
| 1315 | pointing to the end of the chain to make adding headers simple. */ |
| 1316 | |
| 1317 | received_header = header_list = header_last = store_get(sizeof(header_line)); |
| 1318 | header_list->next = NULL; |
| 1319 | header_list->type = htype_old; |
| 1320 | header_list->text = NULL; |
| 1321 | header_list->slen = 0; |
| 1322 | |
| 1323 | /* Control block for the next header to be read. */ |
| 1324 | |
| 1325 | next = store_get(sizeof(header_line)); |
| 1326 | next->text = store_get(header_size); |
| 1327 | |
| 1328 | /* Initialize message id to be null (indicating no message read), and the |
| 1329 | header names list to be the normal list. Indicate there is no data file open |
| 1330 | yet, initialize the size and warning count, and deal with no size limit. */ |
| 1331 | |
| 1332 | message_id[0] = 0; |
| 1333 | data_file = NULL; |
| 1334 | data_fd = -1; |
| 1335 | spool_name[0] = 0; |
| 1336 | message_size = 0; |
| 1337 | warning_count = 0; |
| 1338 | received_count = 1; /* For the one we will add */ |
| 1339 | |
| 1340 | if (thismessage_size_limit <= 0) thismessage_size_limit = INT_MAX; |
| 1341 | |
| 1342 | /* While reading the message, the following counts are computed. */ |
| 1343 | |
| 1344 | message_linecount = body_linecount = body_zerocount = 0; |
| 1345 | |
| 1346 | #ifdef EXPERIMENTAL_DOMAINKEYS |
| 1347 | /* Call into DK to set up the context. Check if DK is to be run are carried out |
| 1348 | inside dk_exim_verify_init(). */ |
| 1349 | dk_exim_verify_init(); |
| 1350 | #endif |
| 1351 | |
| 1352 | /* Remember the time of reception. Exim uses time+pid for uniqueness of message |
| 1353 | ids, and fractions of a second are required. See the comments that precede the |
| 1354 | message id creation below. */ |
| 1355 | |
| 1356 | (void)gettimeofday(&message_id_tv, NULL); |
| 1357 | |
| 1358 | /* For other uses of the received time we can operate with granularity of one |
| 1359 | second, and for that we use the global variable received_time. This is for |
| 1360 | things like ultimate message timeouts. */ |
| 1361 | |
| 1362 | received_time = message_id_tv.tv_sec; |
| 1363 | |
| 1364 | /* If SMTP input, set the special handler for timeouts. The alarm() calls |
| 1365 | happen in the smtp_getc() function when it refills its buffer. */ |
| 1366 | |
| 1367 | if (smtp_input) os_non_restarting_signal(SIGALRM, data_timeout_handler); |
| 1368 | |
| 1369 | /* If not SMTP input, timeout happens only if configured, and we just set a |
| 1370 | single timeout for the whole message. */ |
| 1371 | |
| 1372 | else if (receive_timeout > 0) |
| 1373 | { |
| 1374 | os_non_restarting_signal(SIGALRM, data_timeout_handler); |
| 1375 | alarm(receive_timeout); |
| 1376 | } |
| 1377 | |
| 1378 | /* SIGTERM and SIGINT are caught always. */ |
| 1379 | |
| 1380 | signal(SIGTERM, data_sigterm_sigint_handler); |
| 1381 | signal(SIGINT, data_sigterm_sigint_handler); |
| 1382 | |
| 1383 | /* Header lines in messages are not supposed to be very long, though when |
| 1384 | unfolded, to: and cc: headers can take up a lot of store. We must also cope |
| 1385 | with the possibility of junk being thrown at us. Start by getting 256 bytes for |
| 1386 | storing the header, and extend this as necessary using string_cat(). |
| 1387 | |
| 1388 | To cope with total lunacies, impose an upper limit on the length of the header |
| 1389 | section of the message, as otherwise the store will fill up. We must also cope |
| 1390 | with the possibility of binary zeros in the data. Hence we cannot use fgets(). |
| 1391 | Folded header lines are joined into one string, leaving the '\n' characters |
| 1392 | inside them, so that writing them out reproduces the input. |
| 1393 | |
| 1394 | Loop for each character of each header; the next structure for chaining the |
| 1395 | header is set up already, with ptr the offset of the next character in |
| 1396 | next->text. */ |
| 1397 | |
| 1398 | for (;;) |
| 1399 | { |
| 1400 | int ch = (RECEIVE_GETC)(); |
| 1401 | |
| 1402 | /* If we hit EOF on a SMTP connection, it's an error, since incoming |
| 1403 | SMTP must have a correct "." terminator. */ |
| 1404 | |
| 1405 | if (ch == EOF && smtp_input /* && !smtp_batched_input */) |
| 1406 | { |
| 1407 | smtp_reply = handle_lost_connection(US" (header)"); |
| 1408 | smtp_yield = FALSE; |
| 1409 | goto TIDYUP; /* Skip to end of function */ |
| 1410 | } |
| 1411 | |
| 1412 | /* See if we are at the current header's size limit - there must be at least |
| 1413 | four bytes left. This allows for the new character plus a zero, plus two for |
| 1414 | extra insertions when we are playing games with dots and carriage returns. If |
| 1415 | we are at the limit, extend the text buffer. This could have been done |
| 1416 | automatically using string_cat() but because this is a tightish loop storing |
| 1417 | only one character at a time, we choose to do it inline. Normally |
| 1418 | store_extend() will be able to extend the block; only at the end of a big |
| 1419 | store block will a copy be needed. To handle the case of very long headers |
| 1420 | (and sometimes lunatic messages can have ones that are 100s of K long) we |
| 1421 | call store_release() for strings that have been copied - if the string is at |
| 1422 | the start of a block (and therefore the only thing in it, because we aren't |
| 1423 | doing any other gets), the block gets freed. We can only do this because we |
| 1424 | know there are no other calls to store_get() going on. */ |
| 1425 | |
| 1426 | if (ptr >= header_size - 4) |
| 1427 | { |
| 1428 | int oldsize = header_size; |
| 1429 | /* header_size += 256; */ |
| 1430 | header_size *= 2; |
| 1431 | if (!store_extend(next->text, oldsize, header_size)) |
| 1432 | { |
| 1433 | uschar *newtext = store_get(header_size); |
| 1434 | memcpy(newtext, next->text, ptr); |
| 1435 | store_release(next->text); |
| 1436 | next->text = newtext; |
| 1437 | } |
| 1438 | } |
| 1439 | |
| 1440 | /* Cope with receiving a binary zero. There is dispute about whether |
| 1441 | these should be allowed in RFC 822 messages. The middle view is that they |
| 1442 | should not be allowed in headers, at least. Exim takes this attitude at |
| 1443 | the moment. We can't just stomp on them here, because we don't know that |
| 1444 | this line is a header yet. Set a flag to cause scanning later. */ |
| 1445 | |
| 1446 | if (ch == 0) had_zero++; |
| 1447 | |
| 1448 | /* Test for termination. Lines in remote SMTP are terminated by CRLF, while |
| 1449 | those from data files use just LF. Treat LF in local SMTP input as a |
| 1450 | terminator too. Treat EOF as a line terminator always. */ |
| 1451 | |
| 1452 | if (ch == EOF) goto EOL; |
| 1453 | |
| 1454 | /* FUDGE: There are sites out there that don't send CRs before their LFs, and |
| 1455 | other MTAs accept this. We are therefore forced into this "liberalisation" |
| 1456 | too, so we accept LF as a line terminator whatever the source of the message. |
| 1457 | However, if the first line of the message ended with a CRLF, we treat a bare |
| 1458 | LF specially by inserting a white space after it to ensure that the header |
| 1459 | line is not terminated. */ |
| 1460 | |
| 1461 | if (ch == '\n') |
| 1462 | { |
| 1463 | if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = FALSE; |
| 1464 | else if (first_line_ended_crlf) RECEIVE_UNGETC(' '); |
| 1465 | goto EOL; |
| 1466 | } |
| 1467 | |
| 1468 | /* This is not the end of the line. If this is SMTP input and this is |
| 1469 | the first character in the line and it is a "." character, ignore it. |
| 1470 | This implements the dot-doubling rule, though header lines starting with |
| 1471 | dots aren't exactly common. They are legal in RFC 822, though. If the |
| 1472 | following is CRLF or LF, this is the line that that terminates the |
| 1473 | entire message. We set message_ended to indicate this has happened (to |
| 1474 | prevent further reading), and break out of the loop, having freed the |
| 1475 | empty header, and set next = NULL to indicate no data line. */ |
| 1476 | |
| 1477 | if (ptr == 0 && ch == '.' && (smtp_input || dot_ends)) |
| 1478 | { |
| 1479 | ch = (RECEIVE_GETC)(); |
| 1480 | if (ch == '\r') |
| 1481 | { |
| 1482 | ch = (RECEIVE_GETC)(); |
| 1483 | if (ch != '\n') |
| 1484 | { |
| 1485 | RECEIVE_UNGETC(ch); |
| 1486 | ch = '\r'; /* Revert to CR */ |
| 1487 | } |
| 1488 | } |
| 1489 | if (ch == '\n') |
| 1490 | { |
| 1491 | message_ended = END_DOT; |
| 1492 | store_reset(next); |
| 1493 | next = NULL; |
| 1494 | break; /* End character-reading loop */ |
| 1495 | } |
| 1496 | |
| 1497 | /* For non-SMTP input, the dot at the start of the line was really a data |
| 1498 | character. What is now in ch is the following character. We guaranteed |
| 1499 | enough space for this above. */ |
| 1500 | |
| 1501 | if (!smtp_input) |
| 1502 | { |
| 1503 | next->text[ptr++] = '.'; |
| 1504 | message_size++; |
| 1505 | } |
| 1506 | } |
| 1507 | |
| 1508 | /* If CR is immediately followed by LF, end the line, ignoring the CR, and |
| 1509 | remember this case if this is the first line ending. */ |
| 1510 | |
| 1511 | if (ch == '\r') |
| 1512 | { |
| 1513 | ch = (RECEIVE_GETC)(); |
| 1514 | if (ch == '\n') |
| 1515 | { |
| 1516 | if (first_line_ended_crlf == TRUE_UNSET) first_line_ended_crlf = TRUE; |
| 1517 | goto EOL; |
| 1518 | } |
| 1519 | |
| 1520 | /* Otherwise, put back the character after CR, and turn the bare CR |
| 1521 | into LF SP. */ |
| 1522 | |
| 1523 | ch = (RECEIVE_UNGETC)(ch); |
| 1524 | next->text[ptr++] = '\n'; |
| 1525 | message_size++; |
| 1526 | ch = ' '; |
| 1527 | } |
| 1528 | |
| 1529 | /* We have a data character for the header line. */ |
| 1530 | |
| 1531 | next->text[ptr++] = ch; /* Add to buffer */ |
| 1532 | message_size++; /* Total message size so far */ |
| 1533 | |
| 1534 | /* Handle failure due to a humungously long header section. The >= allows |
| 1535 | for the terminating \n. Add what we have so far onto the headers list so |
| 1536 | that it gets reflected in any error message, and back up the just-read |
| 1537 | character. */ |
| 1538 | |
| 1539 | if (message_size >= header_maxsize) |
| 1540 | { |
| 1541 | next->text[ptr] = 0; |
| 1542 | next->slen = ptr; |
| 1543 | next->type = htype_other; |
| 1544 | next->next = NULL; |
| 1545 | header_last->next = next; |
| 1546 | header_last = next; |
| 1547 | |
| 1548 | log_write(0, LOG_MAIN, "ridiculously long message header received from " |
| 1549 | "%s (more than %d characters): message abandoned", |
| 1550 | sender_host_unknown? sender_ident : sender_fullhost, header_maxsize); |
| 1551 | |
| 1552 | if (smtp_input) |
| 1553 | { |
| 1554 | smtp_reply = US"552 Message header is ridiculously long"; |
| 1555 | receive_swallow_smtp(); |
| 1556 | goto TIDYUP; /* Skip to end of function */ |
| 1557 | } |
| 1558 | |
| 1559 | else |
| 1560 | { |
| 1561 | give_local_error(ERRMESS_VLONGHEADER, |
| 1562 | string_sprintf("message header longer than %d characters received: " |
| 1563 | "message not accepted", header_maxsize), US"", error_rc, stdin, |
| 1564 | header_list->next); |
| 1565 | /* Does not return */ |
| 1566 | } |
| 1567 | } |
| 1568 | |
| 1569 | continue; /* With next input character */ |
| 1570 | |
| 1571 | /* End of header line reached */ |
| 1572 | |
| 1573 | EOL: |
| 1574 | |
| 1575 | /* Keep track of lines for BSMTP errors and overall message_linecount. */ |
| 1576 | |
| 1577 | receive_linecount++; |
| 1578 | message_linecount++; |
| 1579 | |
| 1580 | /* Now put in the terminating newline. There is always space for |
| 1581 | at least two more characters. */ |
| 1582 | |
| 1583 | next->text[ptr++] = '\n'; |
| 1584 | message_size++; |
| 1585 | |
| 1586 | /* A blank line signals the end of the headers; release the unwanted |
| 1587 | space and set next to NULL to indicate this. */ |
| 1588 | |
| 1589 | if (ptr == 1) |
| 1590 | { |
| 1591 | store_reset(next); |
| 1592 | next = NULL; |
| 1593 | break; |
| 1594 | } |
| 1595 | |
| 1596 | /* There is data in the line; see if the next input character is a |
| 1597 | whitespace character. If it is, we have a continuation of this header line. |
| 1598 | There is always space for at least one character at this point. */ |
| 1599 | |
| 1600 | if (ch != EOF) |
| 1601 | { |
| 1602 | int nextch = (RECEIVE_GETC)(); |
| 1603 | if (nextch == ' ' || nextch == '\t') |
| 1604 | { |
| 1605 | next->text[ptr++] = nextch; |
| 1606 | message_size++; |
| 1607 | continue; /* Iterate the loop */ |
| 1608 | } |
| 1609 | else if (nextch != EOF) (RECEIVE_UNGETC)(nextch); /* For next time */ |
| 1610 | else ch = EOF; /* Cause main loop to exit at end */ |
| 1611 | } |
| 1612 | |
| 1613 | /* We have got to the real line end. Terminate the string and release store |
| 1614 | beyond it. If it turns out to be a real header, internal binary zeros will |
| 1615 | be squashed later. */ |
| 1616 | |
| 1617 | next->text[ptr] = 0; |
| 1618 | next->slen = ptr; |
| 1619 | store_reset(next->text + ptr + 1); |
| 1620 | |
| 1621 | /* Check the running total size against the overall message size limit. We |
| 1622 | don't expect to fail here, but if the overall limit is set less than MESSAGE_ |
| 1623 | MAXSIZE and a big header is sent, we want to catch it. Just stop reading |
| 1624 | headers - the code to read the body will then also hit the buffer. */ |
| 1625 | |
| 1626 | if (message_size > thismessage_size_limit) break; |
| 1627 | |
| 1628 | /* A line that is not syntactically correct for a header also marks |
| 1629 | the end of the headers. In this case, we leave next containing the |
| 1630 | first data line. This might actually be several lines because of the |
| 1631 | continuation logic applied above, but that doesn't matter. |
| 1632 | |
| 1633 | It turns out that smail, and presumably sendmail, accept leading lines |
| 1634 | of the form |
| 1635 | |
| 1636 | From ph10 Fri Jan 5 12:35 GMT 1996 |
| 1637 | |
| 1638 | in messages. The "mail" command on Solaris 2 sends such lines. I cannot |
| 1639 | find any documentation of this, but for compatibility it had better be |
| 1640 | accepted. Exim restricts it to the case of non-smtp messages, and |
| 1641 | treats it as an alternative to the -f command line option. Thus it is |
| 1642 | ignored except for trusted users or filter testing. Otherwise it is taken |
| 1643 | as the sender address, unless -f was used (sendmail compatibility). |
| 1644 | |
| 1645 | It further turns out that some UUCPs generate the From_line in a different |
| 1646 | format, e.g. |
| 1647 | |
| 1648 | From ph10 Fri, 7 Jan 97 14:00:00 GMT |
| 1649 | |
| 1650 | The regex for matching these things is now capable of recognizing both |
| 1651 | formats (including 2- and 4-digit years in the latter). In fact, the regex |
| 1652 | is now configurable, as is the expansion string to fish out the sender. |
| 1653 | |
| 1654 | Even further on it has been discovered that some broken clients send |
| 1655 | these lines in SMTP messages. There is now an option to ignore them from |
| 1656 | specified hosts or networks. Sigh. */ |
| 1657 | |
| 1658 | if (header_last == header_list && |
| 1659 | (!smtp_input |
| 1660 | || |
| 1661 | (sender_host_address != NULL && |
| 1662 | verify_check_host(&ignore_fromline_hosts) == OK) |
| 1663 | || |
| 1664 | (sender_host_address == NULL && ignore_fromline_local) |
| 1665 | ) && |
| 1666 | regex_match_and_setup(regex_From, next->text, 0, -1)) |
| 1667 | { |
| 1668 | if (!sender_address_forced) |
| 1669 | { |
| 1670 | uschar *uucp_sender = expand_string(uucp_from_sender); |
| 1671 | if (uucp_sender == NULL) |
| 1672 | { |
| 1673 | log_write(0, LOG_MAIN|LOG_PANIC, |
| 1674 | "expansion of \"%s\" failed after matching " |
| 1675 | "\"From \" line: %s", uucp_from_sender, expand_string_message); |
| 1676 | } |
| 1677 | else |
| 1678 | { |
| 1679 | int start, end, domain; |
| 1680 | uschar *errmess; |
| 1681 | uschar *newsender = parse_extract_address(uucp_sender, &errmess, |
| 1682 | &start, &end, &domain, TRUE); |
| 1683 | if (newsender != NULL) |
| 1684 | { |
| 1685 | if (domain == 0 && newsender[0] != 0) |
| 1686 | newsender = rewrite_address_qualify(newsender, FALSE); |
| 1687 | |
| 1688 | if (filter_test != FTEST_NONE || receive_check_set_sender(newsender)) |
| 1689 | { |
| 1690 | sender_address = newsender; |
| 1691 | |
| 1692 | if (trusted_caller || filter_test != FTEST_NONE) |
| 1693 | { |
| 1694 | authenticated_sender = NULL; |
| 1695 | originator_name = US""; |
| 1696 | sender_local = FALSE; |
| 1697 | } |
| 1698 | |
| 1699 | if (filter_test != FTEST_NONE) |
| 1700 | printf("Sender taken from \"From \" line\n"); |
| 1701 | } |
| 1702 | } |
| 1703 | } |
| 1704 | } |
| 1705 | } |
| 1706 | |
| 1707 | /* Not a leading "From " line. Check to see if it is a valid header line. |
| 1708 | Header names may contain any non-control characters except space and colon, |
| 1709 | amazingly. */ |
| 1710 | |
| 1711 | else |
| 1712 | { |
| 1713 | uschar *p = next->text; |
| 1714 | |
| 1715 | /* If not a valid header line, break from the header reading loop, leaving |
| 1716 | next != NULL, indicating that it holds the first line of the body. */ |
| 1717 | |
| 1718 | if (isspace(*p)) break; |
| 1719 | while (mac_isgraph(*p) && *p != ':') p++; |
| 1720 | while (isspace(*p)) p++; |
| 1721 | if (*p != ':') |
| 1722 | { |
| 1723 | body_zerocount = had_zero; |
| 1724 | break; |
| 1725 | } |
| 1726 | |
| 1727 | /* We have a valid header line. If there were any binary zeroes in |
| 1728 | the line, stomp on them here. */ |
| 1729 | |
| 1730 | if (had_zero > 0) |
| 1731 | for (p = next->text; p < next->text + ptr; p++) if (*p == 0) *p = '?'; |
| 1732 | |
| 1733 | /* It is perfectly legal to have an empty continuation line |
| 1734 | at the end of a header, but it is confusing to humans |
| 1735 | looking at such messages, since it looks like a blank line. |
| 1736 | Reduce confusion by removing redundant white space at the |
| 1737 | end. We know that there is at least one printing character |
| 1738 | (the ':' tested for above) so there is no danger of running |
| 1739 | off the end. */ |
| 1740 | |
| 1741 | p = next->text + ptr - 2; |
| 1742 | for (;;) |
| 1743 | { |
| 1744 | while (*p == ' ' || *p == '\t') p--; |
| 1745 | if (*p != '\n') break; |
| 1746 | ptr = (p--) - next->text + 1; |
| 1747 | message_size -= next->slen - ptr; |
| 1748 | next->text[ptr] = 0; |
| 1749 | next->slen = ptr; |
| 1750 | } |
| 1751 | |
| 1752 | /* Add the header to the chain */ |
| 1753 | |
| 1754 | next->type = htype_other; |
| 1755 | next->next = NULL; |
| 1756 | header_last->next = next; |
| 1757 | header_last = next; |
| 1758 | |
| 1759 | /* Check the limit for individual line lengths. This comes after adding to |
| 1760 | the chain so that the failing line is reflected if a bounce is generated |
| 1761 | (for a local message). */ |
| 1762 | |
| 1763 | if (header_line_maxsize > 0 && next->slen > header_line_maxsize) |
| 1764 | { |
| 1765 | log_write(0, LOG_MAIN, "overlong message header line received from " |
| 1766 | "%s (more than %d characters): message abandoned", |
| 1767 | sender_host_unknown? sender_ident : sender_fullhost, |
| 1768 | header_line_maxsize); |
| 1769 | |
| 1770 | if (smtp_input) |
| 1771 | { |
| 1772 | smtp_reply = US"552 A message header line is too long"; |
| 1773 | receive_swallow_smtp(); |
| 1774 | goto TIDYUP; /* Skip to end of function */ |
| 1775 | } |
| 1776 | |
| 1777 | else |
| 1778 | { |
| 1779 | give_local_error(ERRMESS_VLONGHDRLINE, |
| 1780 | string_sprintf("message header line longer than %d characters " |
| 1781 | "received: message not accepted", header_line_maxsize), US"", |
| 1782 | error_rc, stdin, header_list->next); |
| 1783 | /* Does not return */ |
| 1784 | } |
| 1785 | } |
| 1786 | |
| 1787 | /* Note if any resent- fields exist. */ |
| 1788 | |
| 1789 | if (!resents_exist && strncmpic(next->text, US"resent-", 7) == 0) |
| 1790 | { |
| 1791 | resents_exist = TRUE; |
| 1792 | resent_prefix = US"Resent-"; |
| 1793 | } |
| 1794 | } |
| 1795 | |
| 1796 | /* The line has been handled. If we have hit EOF, break out of the loop, |
| 1797 | indicating no pending data line. */ |
| 1798 | |
| 1799 | if (ch == EOF) { next = NULL; break; } |
| 1800 | |
| 1801 | /* Set up for the next header */ |
| 1802 | |
| 1803 | header_size = 256; |
| 1804 | next = store_get(sizeof(header_line)); |
| 1805 | next->text = store_get(header_size); |
| 1806 | ptr = 0; |
| 1807 | had_zero = 0; |
| 1808 | } /* Continue, starting to read the next header */ |
| 1809 | |
| 1810 | /* At this point, we have read all the headers into a data structure in main |
| 1811 | store. The first header is still the dummy placeholder for the Received: header |
| 1812 | we are going to generate a bit later on. If next != NULL, it contains the first |
| 1813 | data line - which terminated the headers before reaching a blank line (not the |
| 1814 | normal case). */ |
| 1815 | |
| 1816 | DEBUG(D_receive) |
| 1817 | { |
| 1818 | debug_printf(">>Headers received:\n"); |
| 1819 | for (h = header_list->next; h != NULL; h = h->next) |
| 1820 | debug_printf("%s", h->text); |
| 1821 | debug_printf("\n"); |
| 1822 | } |
| 1823 | |
| 1824 | /* End of file on any SMTP connection is an error. If an incoming SMTP call |
| 1825 | is dropped immediately after valid headers, the next thing we will see is EOF. |
| 1826 | We must test for this specially, as further down the reading of the data is |
| 1827 | skipped if already at EOF. */ |
| 1828 | |
| 1829 | if (smtp_input && (receive_feof)()) |
| 1830 | { |
| 1831 | smtp_reply = handle_lost_connection(US" (after header)"); |
| 1832 | smtp_yield = FALSE; |
| 1833 | goto TIDYUP; /* Skip to end of function */ |
| 1834 | } |
| 1835 | |
| 1836 | /* If this is a filter test run and no headers were read, output a warning |
| 1837 | in case there is a mistake in the test message. */ |
| 1838 | |
| 1839 | if (filter_test != FTEST_NONE && header_list->next == NULL) |
| 1840 | printf("Warning: no message headers read\n"); |
| 1841 | |
| 1842 | |
| 1843 | /* Scan the headers to identify them. Some are merely marked for later |
| 1844 | processing; some are dealt with here. */ |
| 1845 | |
| 1846 | for (h = header_list->next; h != NULL; h = h->next) |
| 1847 | { |
| 1848 | BOOL is_resent = strncmpic(h->text, US"resent-", 7) == 0; |
| 1849 | if (is_resent) contains_resent_headers = TRUE; |
| 1850 | |
| 1851 | switch (header_checkname(h, is_resent)) |
| 1852 | { |
| 1853 | /* "Bcc:" gets flagged, and its existence noted, whether it's resent- or |
| 1854 | not. */ |
| 1855 | |
| 1856 | case htype_bcc: |
| 1857 | h->type = htype_bcc; |
| 1858 | /**** |
| 1859 | bcc_header_exists = TRUE; |
| 1860 | ****/ |
| 1861 | break; |
| 1862 | |
| 1863 | /* "Cc:" gets flagged, and the existence of a recipient header is noted, |
| 1864 | whether it's resent- or not. */ |
| 1865 | |
| 1866 | case htype_cc: |
| 1867 | h->type = htype_cc; |
| 1868 | /**** |
| 1869 | to_or_cc_header_exists = TRUE; |
| 1870 | ****/ |
| 1871 | break; |
| 1872 | |
| 1873 | /* Record whether a Date: or Resent-Date: header exists, as appropriate. */ |
| 1874 | |
| 1875 | case htype_date: |
| 1876 | date_header_exists = !resents_exist || is_resent; |
| 1877 | break; |
| 1878 | |
| 1879 | /* Same comments as about Return-Path: below. */ |
| 1880 | |
| 1881 | case htype_delivery_date: |
| 1882 | if (delivery_date_remove) h->type = htype_old; |
| 1883 | break; |
| 1884 | |
| 1885 | /* Same comments as about Return-Path: below. */ |
| 1886 | |
| 1887 | case htype_envelope_to: |
| 1888 | if (envelope_to_remove) h->type = htype_old; |
| 1889 | break; |
| 1890 | |
| 1891 | /* Mark all "From:" headers so they get rewritten. Save the one that is to |
| 1892 | be used for Sender: checking. For Sendmail compatibility, if the "From:" |
| 1893 | header consists of just the login id of the user who called Exim, rewrite |
| 1894 | it with the gecos field first. Apply this rule to Resent-From: if there |
| 1895 | are resent- fields. */ |
| 1896 | |
| 1897 | case htype_from: |
| 1898 | h->type = htype_from; |
| 1899 | if (!resents_exist || is_resent) |
| 1900 | { |
| 1901 | from_header = h; |
| 1902 | if (!smtp_input) |
| 1903 | { |
| 1904 | uschar *s = Ustrchr(h->text, ':') + 1; |
| 1905 | while (isspace(*s)) s++; |
| 1906 | if (strncmpic(s, originator_login, h->slen - (s - h->text) - 1) == 0) |
| 1907 | { |
| 1908 | uschar *name = is_resent? US"Resent-From" : US"From"; |
| 1909 | header_add(htype_from, "%s: %s <%s@%s>\n", name, originator_name, |
| 1910 | originator_login, qualify_domain_sender); |
| 1911 | from_header = header_last; |
| 1912 | h->type = htype_old; |
| 1913 | DEBUG(D_receive|D_rewrite) |
| 1914 | debug_printf("rewrote \"%s:\" header using gecos\n", name); |
| 1915 | } |
| 1916 | } |
| 1917 | } |
| 1918 | break; |
| 1919 | |
| 1920 | /* Identify the Message-id: header for generating "in-reply-to" in the |
| 1921 | autoreply transport. For incoming logging, save any resent- value. In both |
| 1922 | cases, take just the first of any multiples. */ |
| 1923 | |
| 1924 | case htype_id: |
| 1925 | if (msgid_header == NULL && (!resents_exist || is_resent)) |
| 1926 | { |
| 1927 | msgid_header = h; |
| 1928 | h->type = htype_id; |
| 1929 | } |
| 1930 | break; |
| 1931 | |
| 1932 | /* Flag all Received: headers */ |
| 1933 | |
| 1934 | case htype_received: |
| 1935 | h->type = htype_received; |
| 1936 | received_count++; |
| 1937 | break; |
| 1938 | |
| 1939 | /* "Reply-to:" is just noted (there is no resent-reply-to field) */ |
| 1940 | |
| 1941 | case htype_reply_to: |
| 1942 | h->type = htype_reply_to; |
| 1943 | break; |
| 1944 | |
| 1945 | /* The Return-path: header is supposed to be added to messages when |
| 1946 | they leave the SMTP system. We shouldn't receive messages that already |
| 1947 | contain Return-path. However, since Exim generates Return-path: on |
| 1948 | local delivery, resent messages may well contain it. We therefore |
| 1949 | provide an option (which defaults on) to remove any Return-path: headers |
| 1950 | on input. Removal actually means flagging as "old", which prevents the |
| 1951 | header being transmitted with the message. */ |
| 1952 | |
| 1953 | case htype_return_path: |
| 1954 | if (return_path_remove) h->type = htype_old; |
| 1955 | |
| 1956 | /* If we are testing a mail filter file, use the value of the |
| 1957 | Return-Path: header to set up the return_path variable, which is not |
| 1958 | otherwise set. However, remove any <> that surround the address |
| 1959 | because the variable doesn't have these. */ |
| 1960 | |
| 1961 | if (filter_test != FTEST_NONE) |
| 1962 | { |
| 1963 | uschar *start = h->text + 12; |
| 1964 | uschar *end = start + Ustrlen(start); |
| 1965 | while (isspace(*start)) start++; |
| 1966 | while (end > start && isspace(end[-1])) end--; |
| 1967 | if (*start == '<' && end[-1] == '>') |
| 1968 | { |
| 1969 | start++; |
| 1970 | end--; |
| 1971 | } |
| 1972 | return_path = string_copyn(start, end - start); |
| 1973 | printf("Return-path taken from \"Return-path:\" header line\n"); |
| 1974 | } |
| 1975 | break; |
| 1976 | |
| 1977 | /* If there is a "Sender:" header and the message is locally originated, |
| 1978 | and from an untrusted caller, or if we are in submission mode for a remote |
| 1979 | message, mark it "old" so that it will not be transmitted with the message, |
| 1980 | unless active_local_sender_retain is set. (This can only be true if |
| 1981 | active_local_from_check is false.) If there are any resent- headers in the |
| 1982 | message, apply this rule to Resent-Sender: instead of Sender:. Messages |
| 1983 | with multiple resent- header sets cannot be tidily handled. (For this |
| 1984 | reason, at least one MUA - Pine - turns old resent- headers into X-resent- |
| 1985 | headers when resending, leaving just one set.) */ |
| 1986 | |
| 1987 | case htype_sender: |
| 1988 | h->type = ((!active_local_sender_retain && |
| 1989 | ((sender_local && !trusted_caller) || submission_mode) |
| 1990 | ) && |
| 1991 | (!resents_exist||is_resent))? |
| 1992 | htype_old : htype_sender; |
| 1993 | break; |
| 1994 | |
| 1995 | /* Remember the Subject: header for logging. There is no Resent-Subject */ |
| 1996 | |
| 1997 | case htype_subject: |
| 1998 | subject_header = h; |
| 1999 | break; |
| 2000 | |
| 2001 | /* "To:" gets flagged, and the existence of a recipient header is noted, |
| 2002 | whether it's resent- or not. */ |
| 2003 | |
| 2004 | case htype_to: |
| 2005 | h->type = htype_to; |
| 2006 | /**** |
| 2007 | to_or_cc_header_exists = TRUE; |
| 2008 | ****/ |
| 2009 | break; |
| 2010 | } |
| 2011 | } |
| 2012 | |
| 2013 | /* Extract recipients from the headers if that is required (the -t option). |
| 2014 | Note that this is documented as being done *before* any address rewriting takes |
| 2015 | place. There are two possibilities: |
| 2016 | |
| 2017 | (1) According to sendmail documentation for Solaris, IRIX, and HP-UX, any |
| 2018 | recipients already listed are to be REMOVED from the message. Smail 3 works |
| 2019 | like this. We need to build a non-recipients tree for that list, because in |
| 2020 | subsequent processing this data is held in a tree and that's what the |
| 2021 | spool_write_header() function expects. Make sure that non-recipient addresses |
| 2022 | are fully qualified and rewritten if necessary. |
| 2023 | |
| 2024 | (2) According to other sendmail documentation, -t ADDS extracted recipients to |
| 2025 | those in the command line arguments (and it is rumoured some other MTAs do |
| 2026 | this). Therefore, there is an option to make Exim behave this way. |
| 2027 | |
| 2028 | *** Notes on "Resent-" header lines *** |
| 2029 | |
| 2030 | The presence of resent-headers in the message makes -t horribly ambiguous. |
| 2031 | Experiments with sendmail showed that it uses recipients for all resent- |
| 2032 | headers, totally ignoring the concept of "sets of resent- headers" as described |
| 2033 | in RFC 2822 section 3.6.6. Sendmail also amalgamates them into a single set |
| 2034 | with all the addresses in one instance of each header. |
| 2035 | |
| 2036 | This seems to me not to be at all sensible. Before release 4.20, Exim 4 gave an |
| 2037 | error for -t if there were resent- headers in the message. However, after a |
| 2038 | discussion on the mailing list, I've learned that there are MUAs that use |
| 2039 | resent- headers with -t, and also that the stuff about sets of resent- headers |
| 2040 | and their ordering in RFC 2822 is generally ignored. An MUA that submits a |
| 2041 | message with -t and resent- header lines makes sure that only *its* resent- |
| 2042 | headers are present; previous ones are often renamed as X-resent- for example. |
| 2043 | |
| 2044 | Consequently, Exim has been changed so that, if any resent- header lines are |
| 2045 | present, the recipients are taken from all of the appropriate resent- lines, |
| 2046 | and not from the ordinary To:, Cc:, etc. */ |
| 2047 | |
| 2048 | if (extract_recip) |
| 2049 | { |
| 2050 | int rcount = 0; |
| 2051 | error_block **bnext = &bad_addresses; |
| 2052 | |
| 2053 | if (extract_addresses_remove_arguments) |
| 2054 | { |
| 2055 | while (recipients_count-- > 0) |
| 2056 | { |
| 2057 | uschar *s = rewrite_address(recipients_list[recipients_count].address, |
| 2058 | TRUE, TRUE, global_rewrite_rules, rewrite_existflags); |
| 2059 | tree_add_nonrecipient(s); |
| 2060 | } |
| 2061 | recipients_list = NULL; |
| 2062 | recipients_count = recipients_list_max = 0; |
| 2063 | } |
| 2064 | |
| 2065 | parse_allow_group = TRUE; /* Allow address group syntax */ |
| 2066 | |
| 2067 | /* Now scan the headers */ |
| 2068 | |
| 2069 | for (h = header_list->next; h != NULL; h = h->next) |
| 2070 | { |
| 2071 | if ((h->type == htype_to || h->type == htype_cc || h->type == htype_bcc) && |
| 2072 | (!contains_resent_headers || strncmpic(h->text, US"resent-", 7) == 0)) |
| 2073 | { |
| 2074 | uschar *s = Ustrchr(h->text, ':') + 1; |
| 2075 | while (isspace(*s)) s++; |
| 2076 | |
| 2077 | while (*s != 0) |
| 2078 | { |
| 2079 | uschar *ss = parse_find_address_end(s, FALSE); |
| 2080 | uschar *recipient, *errmess, *p, *pp; |
| 2081 | int start, end, domain; |
| 2082 | |
| 2083 | /* Check on maximum */ |
| 2084 | |
| 2085 | if (recipients_max > 0 && ++rcount > recipients_max) |
| 2086 | { |
| 2087 | give_local_error(ERRMESS_TOOMANYRECIP, US"too many recipients", |
| 2088 | US"message rejected: ", error_rc, stdin, NULL); |
| 2089 | /* Does not return */ |
| 2090 | } |
| 2091 | |
| 2092 | /* Make a copy of the address, and remove any internal newlines. These |
| 2093 | may be present as a result of continuations of the header line. The |
| 2094 | white space that follows the newline must not be removed - it is part |
| 2095 | of the header. */ |
| 2096 | |
| 2097 | pp = recipient = store_get(ss - s + 1); |
| 2098 | for (p = s; p < ss; p++) if (*p != '\n') *pp++ = *p; |
| 2099 | *pp = 0; |
| 2100 | recipient = parse_extract_address(recipient, &errmess, &start, &end, |
| 2101 | &domain, FALSE); |
| 2102 | |
| 2103 | /* Keep a list of all the bad addresses so we can send a single |
| 2104 | error message at the end. However, an empty address is not an error; |
| 2105 | just ignore it. This can come from an empty group list like |
| 2106 | |
| 2107 | To: Recipients of list:; |
| 2108 | |
| 2109 | If there are no recipients at all, an error will occur later. */ |
| 2110 | |
| 2111 | if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0) |
| 2112 | { |
| 2113 | int len = Ustrlen(s); |
| 2114 | error_block *b = store_get(sizeof(error_block)); |
| 2115 | while (len > 0 && isspace(s[len-1])) len--; |
| 2116 | b->next = NULL; |
| 2117 | b->text1 = string_printing(string_copyn(s, len)); |
| 2118 | b->text2 = errmess; |
| 2119 | *bnext = b; |
| 2120 | bnext = &(b->next); |
| 2121 | } |
| 2122 | |
| 2123 | /* If the recipient is already in the nonrecipients tree, it must |
| 2124 | have appeared on the command line with the option extract_addresses_ |
| 2125 | remove_arguments set. Do not add it to the recipients, and keep a note |
| 2126 | that this has happened, in order to give a better error if there are |
| 2127 | no recipients left. */ |
| 2128 | |
| 2129 | else if (recipient != NULL) |
| 2130 | { |
| 2131 | if (tree_search(tree_nonrecipients, recipient) == NULL) |
| 2132 | receive_add_recipient(recipient, -1); |
| 2133 | else |
| 2134 | extracted_ignored = TRUE; |
| 2135 | } |
| 2136 | |
| 2137 | /* Move on past this address */ |
| 2138 | |
| 2139 | s = ss + (*ss? 1:0); |
| 2140 | while (isspace(*s)) s++; |
| 2141 | } |
| 2142 | |
| 2143 | /* If this was the bcc: header, mark it "old", which means it |
| 2144 | will be kept on the spool, but not transmitted as part of the |
| 2145 | message. */ |
| 2146 | |
| 2147 | if (h->type == htype_bcc) |
| 2148 | { |
| 2149 | h->type = htype_old; |
| 2150 | /**** |
| 2151 | bcc_header_exists = FALSE; |
| 2152 | ****/ |
| 2153 | } |
| 2154 | } /* For appropriate header line */ |
| 2155 | } /* For each header line */ |
| 2156 | |
| 2157 | parse_allow_group = FALSE; /* Reset group syntax flags */ |
| 2158 | parse_found_group = FALSE; |
| 2159 | } |
| 2160 | |
| 2161 | /* Now build the unique message id. This has changed several times over the |
| 2162 | lifetime of Exim. This description was rewritten for Exim 4.14 (February 2003). |
| 2163 | Retaining all the history in the comment has become too unwieldy - read |
| 2164 | previous release sources if you want it. |
| 2165 | |
| 2166 | The message ID has 3 parts: tttttt-pppppp-ss. Each part is a number in base 62. |
| 2167 | The first part is the current time, in seconds. The second part is the current |
| 2168 | pid. Both are large enough to hold 32-bit numbers in base 62. The third part |
| 2169 | can hold a number in the range 0-3843. It used to be a computed sequence |
| 2170 | number, but is now the fractional component of the current time in units of |
| 2171 | 1/2000 of a second (i.e. a value in the range 0-1999). After a message has been |
| 2172 | received, Exim ensures that the timer has ticked at the appropriate level |
| 2173 | before proceeding, to avoid duplication if the pid happened to be re-used |
| 2174 | within the same time period. It seems likely that most messages will take at |
| 2175 | least half a millisecond to be received, so no delay will normally be |
| 2176 | necessary. At least for some time... |
| 2177 | |
| 2178 | There is a modification when localhost_number is set. Formerly this was allowed |
| 2179 | to be as large as 255. Now it is restricted to the range 0-16, and the final |
| 2180 | component of the message id becomes (localhost_number * 200) + fractional time |
| 2181 | in units of 1/200 of a second (i.e. a value in the range 0-3399). |
| 2182 | |
| 2183 | Some not-really-Unix operating systems use case-insensitive file names (Darwin, |
| 2184 | Cygwin). For these, we have to use base 36 instead of base 62. Luckily, this |
| 2185 | still allows the tttttt field to hold a large enough number to last for some |
| 2186 | more decades, and the final two-digit field can hold numbers up to 1295, which |
| 2187 | is enough for milliseconds (instead of 1/2000 of a second). |
| 2188 | |
| 2189 | However, the pppppp field cannot hold a 32-bit pid, but it can hold a 31-bit |
| 2190 | pid, so it is probably safe because pids have to be positive. The |
| 2191 | localhost_number is restricted to 0-10 for these hosts, and when it is set, the |
| 2192 | final field becomes (localhost_number * 100) + fractional time in centiseconds. |
| 2193 | |
| 2194 | Note that string_base62() returns its data in a static storage block, so it |
| 2195 | must be copied before calling string_base62() again. It always returns exactly |
| 2196 | 6 characters. |
| 2197 | |
| 2198 | There doesn't seem to be anything in the RFC which requires a message id to |
| 2199 | start with a letter, but Smail was changed to ensure this. The external form of |
| 2200 | the message id (as supplied by string expansion) therefore starts with an |
| 2201 | additional leading 'E'. The spool file names do not include this leading |
| 2202 | letter and it is not used internally. |
| 2203 | |
| 2204 | NOTE: If ever the format of message ids is changed, the regular expression for |
| 2205 | checking that a string is in this format must be updated in a corresponding |
| 2206 | way. It appears in the initializing code in exim.c. The macro MESSAGE_ID_LENGTH |
| 2207 | must also be changed to reflect the correct string length. Then, of course, |
| 2208 | other programs that rely on the message id format will need updating too. */ |
| 2209 | |
| 2210 | Ustrncpy(message_id, string_base62((long int)(message_id_tv.tv_sec)), 6); |
| 2211 | message_id[6] = '-'; |
| 2212 | Ustrncpy(message_id + 7, string_base62((long int)getpid()), 6); |
| 2213 | |
| 2214 | /* Deal with the case where the host number is set. The value of the number was |
| 2215 | checked when it was read, to ensure it isn't too big. The timing granularity is |
| 2216 | left in id_resolution so that an appropriate wait can be done after receiving |
| 2217 | the message, if necessary (we hope it won't be). */ |
| 2218 | |
| 2219 | if (host_number_string != NULL) |
| 2220 | { |
| 2221 | id_resolution = (BASE_62 == 62)? 5000 : 10000; |
| 2222 | sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s", |
| 2223 | string_base62((long int)( |
| 2224 | host_number * (1000000/id_resolution) + |
| 2225 | message_id_tv.tv_usec/id_resolution)) + 4); |
| 2226 | } |
| 2227 | |
| 2228 | /* Host number not set: final field is just the fractional time at an |
| 2229 | appropriate resolution. */ |
| 2230 | |
| 2231 | else |
| 2232 | { |
| 2233 | id_resolution = (BASE_62 == 62)? 500 : 1000; |
| 2234 | sprintf(CS(message_id + MESSAGE_ID_LENGTH - 3), "-%2s", |
| 2235 | string_base62((long int)(message_id_tv.tv_usec/id_resolution)) + 4); |
| 2236 | } |
| 2237 | |
| 2238 | /* Add the current message id onto the current process info string if |
| 2239 | it will fit. */ |
| 2240 | |
| 2241 | (void)string_format(process_info + process_info_len, |
| 2242 | PROCESS_INFO_SIZE - process_info_len, " id=%s", message_id); |
| 2243 | |
| 2244 | /* If we are using multiple input directories, set up the one for this message |
| 2245 | to be the least significant base-62 digit of the time of arrival. Otherwise |
| 2246 | ensure that it is an empty string. */ |
| 2247 | |
| 2248 | message_subdir[0] = split_spool_directory? message_id[5] : 0; |
| 2249 | |
| 2250 | /* Now that we have the message-id, if there is no message-id: header, generate |
| 2251 | one, but only for local or submission mode messages. This can be |
| 2252 | user-configured if required, but we had better flatten any illegal characters |
| 2253 | therein. */ |
| 2254 | |
| 2255 | if (msgid_header == NULL && (sender_host_address == NULL || submission_mode)) |
| 2256 | { |
| 2257 | uschar *p; |
| 2258 | uschar *id_text = US""; |
| 2259 | uschar *id_domain = primary_hostname; |
| 2260 | |
| 2261 | /* Permit only letters, digits, dots, and hyphens in the domain */ |
| 2262 | |
| 2263 | if (message_id_domain != NULL) |
| 2264 | { |
| 2265 | uschar *new_id_domain = expand_string(message_id_domain); |
| 2266 | if (new_id_domain == NULL) |
| 2267 | { |
| 2268 | if (!expand_string_forcedfail) |
| 2269 | log_write(0, LOG_MAIN|LOG_PANIC, |
| 2270 | "expansion of \"%s\" (message_id_header_domain) " |
| 2271 | "failed: %s", message_id_domain, expand_string_message); |
| 2272 | } |
| 2273 | else if (*new_id_domain != 0) |
| 2274 | { |
| 2275 | id_domain = new_id_domain; |
| 2276 | for (p = id_domain; *p != 0; p++) |
| 2277 | if (!isalnum(*p) && *p != '.') *p = '-'; /* No need to test '-' ! */ |
| 2278 | } |
| 2279 | } |
| 2280 | |
| 2281 | /* Permit all characters except controls and RFC 2822 specials in the |
| 2282 | additional text part. */ |
| 2283 | |
| 2284 | if (message_id_text != NULL) |
| 2285 | { |
| 2286 | uschar *new_id_text = expand_string(message_id_text); |
| 2287 | if (new_id_text == NULL) |
| 2288 | { |
| 2289 | if (!expand_string_forcedfail) |
| 2290 | log_write(0, LOG_MAIN|LOG_PANIC, |
| 2291 | "expansion of \"%s\" (message_id_header_text) " |
| 2292 | "failed: %s", message_id_text, expand_string_message); |
| 2293 | } |
| 2294 | else if (*new_id_text != 0) |
| 2295 | { |
| 2296 | id_text = new_id_text; |
| 2297 | for (p = id_text; *p != 0; p++) |
| 2298 | if (mac_iscntrl_or_special(*p)) *p = '-'; |
| 2299 | } |
| 2300 | } |
| 2301 | |
| 2302 | /* Add the header line */ |
| 2303 | |
| 2304 | header_add(htype_id, "%sMessage-Id: <%s%s%s@%s>\n", resent_prefix, |
| 2305 | message_id_external, (*id_text == 0)? "" : ".", id_text, id_domain); |
| 2306 | } |
| 2307 | |
| 2308 | /* If we are to log recipients, keep a copy of the raw ones before any possible |
| 2309 | rewriting. Must copy the count, because later ACLs and the local_scan() |
| 2310 | function may mess with the real recipients. */ |
| 2311 | |
| 2312 | if ((log_extra_selector & LX_received_recipients) != 0) |
| 2313 | { |
| 2314 | raw_recipients = store_get(recipients_count * sizeof(uschar *)); |
| 2315 | for (i = 0; i < recipients_count; i++) |
| 2316 | raw_recipients[i] = string_copy(recipients_list[i].address); |
| 2317 | raw_recipients_count = recipients_count; |
| 2318 | } |
| 2319 | |
| 2320 | /* Ensure the recipients list is fully qualified and rewritten. Unqualified |
| 2321 | recipients will get here only if the conditions were right (allow_unqualified_ |
| 2322 | recipient is TRUE). */ |
| 2323 | |
| 2324 | for (i = 0; i < recipients_count; i++) |
| 2325 | recipients_list[i].address = |
| 2326 | rewrite_address(recipients_list[i].address, TRUE, TRUE, |
| 2327 | global_rewrite_rules, rewrite_existflags); |
| 2328 | |
| 2329 | /* If there is no From: header, generate one for local or submission_mode |
| 2330 | messages. If there is no sender address, but the sender is local or this is a |
| 2331 | local delivery error, use the originator login. This shouldn't happen for |
| 2332 | genuine bounces, but might happen for autoreplies. The addition of From: must |
| 2333 | be done *before* checking for the possible addition of a Sender: header, |
| 2334 | because untrusted_set_sender allows an untrusted user to set anything in the |
| 2335 | envelope (which might then get info From:) but we still want to ensure a valid |
| 2336 | Sender: if it is required. */ |
| 2337 | |
| 2338 | if (from_header == NULL && (sender_host_address == NULL || submission_mode)) |
| 2339 | { |
| 2340 | /* Envelope sender is empty */ |
| 2341 | |
| 2342 | if (sender_address[0] == 0) |
| 2343 | { |
| 2344 | uschar *fromstart, *fromend; |
| 2345 | |
| 2346 | fromstart = string_sprintf("%sFrom: %s%s", resent_prefix, |
| 2347 | originator_name, (originator_name[0] == 0)? "" : " <"); |
| 2348 | fromend = (originator_name[0] == 0)? US"" : US">"; |
| 2349 | |
| 2350 | if (sender_local || local_error_message) |
| 2351 | { |
| 2352 | header_add(htype_from, "%s%s@%s%s\n", fromstart, |
| 2353 | local_part_quote(originator_login), qualify_domain_sender, |
| 2354 | fromend); |
| 2355 | } |
| 2356 | else if (submission_mode && authenticated_id != NULL) |
| 2357 | { |
| 2358 | if (submission_domain == NULL) |
| 2359 | { |
| 2360 | header_add(htype_from, "%s%s@%s%s\n", fromstart, |
| 2361 | local_part_quote(authenticated_id), qualify_domain_sender, |
| 2362 | fromend); |
| 2363 | } |
| 2364 | else if (submission_domain[0] == 0) /* empty => whole address set */ |
| 2365 | { |
| 2366 | header_add(htype_from, "%s%s%s\n", fromstart, authenticated_id, |
| 2367 | fromend); |
| 2368 | } |
| 2369 | else |
| 2370 | { |
| 2371 | header_add(htype_from, "%s%s@%s%s\n", fromstart, |
| 2372 | local_part_quote(authenticated_id), submission_domain, |
| 2373 | fromend); |
| 2374 | } |
| 2375 | from_header = header_last; /* To get it checked for Sender: */ |
| 2376 | } |
| 2377 | } |
| 2378 | |
| 2379 | /* There is a non-null envelope sender. Build the header using the original |
| 2380 | sender address, before any rewriting that might have been done while |
| 2381 | verifying it. */ |
| 2382 | |
| 2383 | else |
| 2384 | { |
| 2385 | header_add(htype_from, "%sFrom: %s%s%s%s\n", resent_prefix, |
| 2386 | originator_name, |
| 2387 | (originator_name[0] == 0)? "" : " <", |
| 2388 | (sender_address_unrewritten == NULL)? |
| 2389 | sender_address : sender_address_unrewritten, |
| 2390 | (originator_name[0] == 0)? "" : ">"); |
| 2391 | |
| 2392 | from_header = header_last; /* To get it checked for Sender: */ |
| 2393 | } |
| 2394 | } |
| 2395 | |
| 2396 | |
| 2397 | /* If the sender is local, or if we are in submission mode and there is an |
| 2398 | authenticated_id, check that an existing From: is correct, and if not, generate |
| 2399 | a Sender: header, unless disabled. Any previously-existing Sender: header was |
| 2400 | removed above. Note that sender_local, as well as being TRUE if the caller of |
| 2401 | exim is not trusted, is also true if a trusted caller did not supply a -f |
| 2402 | argument for non-smtp input. To allow trusted callers to forge From: without |
| 2403 | supplying -f, we have to test explicitly here. If the From: header contains |
| 2404 | more than one address, then the call to parse_extract_address fails, and a |
| 2405 | Sender: header is inserted, as required. */ |
| 2406 | |
| 2407 | if (from_header != NULL && |
| 2408 | (active_local_from_check && |
| 2409 | ((sender_local && !trusted_caller) || |
| 2410 | (submission_mode && authenticated_id != NULL)) |
| 2411 | )) |
| 2412 | { |
| 2413 | BOOL make_sender = TRUE; |
| 2414 | int start, end, domain; |
| 2415 | uschar *errmess; |
| 2416 | uschar *from_address = |
| 2417 | parse_extract_address(Ustrchr(from_header->text, ':') + 1, &errmess, |
| 2418 | &start, &end, &domain, FALSE); |
| 2419 | uschar *generated_sender_address; |
| 2420 | |
| 2421 | if (submission_mode) |
| 2422 | { |
| 2423 | if (submission_domain == NULL) |
| 2424 | { |
| 2425 | generated_sender_address = string_sprintf("%s@%s", |
| 2426 | local_part_quote(authenticated_id), qualify_domain_sender); |
| 2427 | } |
| 2428 | else if (submission_domain[0] == 0) /* empty => full address */ |
| 2429 | { |
| 2430 | generated_sender_address = string_sprintf("%s", |
| 2431 | authenticated_id); |
| 2432 | } |
| 2433 | else |
| 2434 | { |
| 2435 | generated_sender_address = string_sprintf("%s@%s", |
| 2436 | local_part_quote(authenticated_id), submission_domain); |
| 2437 | } |
| 2438 | } |
| 2439 | else |
| 2440 | generated_sender_address = string_sprintf("%s@%s", |
| 2441 | local_part_quote(originator_login), qualify_domain_sender); |
| 2442 | |
| 2443 | /* Remove permitted prefixes and suffixes from the local part of the From: |
| 2444 | address before doing the comparison with the generated sender. */ |
| 2445 | |
| 2446 | if (from_address != NULL) |
| 2447 | { |
| 2448 | int slen; |
| 2449 | uschar *at = (domain == 0)? NULL : from_address + domain - 1; |
| 2450 | |
| 2451 | if (at != NULL) *at = 0; |
| 2452 | from_address += route_check_prefix(from_address, local_from_prefix); |
| 2453 | slen = route_check_suffix(from_address, local_from_suffix); |
| 2454 | if (slen > 0) |
| 2455 | { |
| 2456 | memmove(from_address+slen, from_address, Ustrlen(from_address)-slen); |
| 2457 | from_address += slen; |
| 2458 | } |
| 2459 | if (at != NULL) *at = '@'; |
| 2460 | |
| 2461 | if (strcmpic(generated_sender_address, from_address) == 0 || |
| 2462 | (domain == 0 && strcmpic(from_address, originator_login) == 0)) |
| 2463 | make_sender = FALSE; |
| 2464 | } |
| 2465 | |
| 2466 | /* We have to cause the Sender header to be rewritten if there are |
| 2467 | appropriate rewriting rules. */ |
| 2468 | |
| 2469 | if (make_sender) |
| 2470 | { |
| 2471 | if (submission_mode && originator_name[0] == 0) |
| 2472 | header_add(htype_sender, "%sSender: %s\n", resent_prefix, |
| 2473 | generated_sender_address); |
| 2474 | else |
| 2475 | header_add(htype_sender, "%sSender: %s <%s>\n", |
| 2476 | resent_prefix, originator_name, generated_sender_address); |
| 2477 | } |
| 2478 | |
| 2479 | /* Ensure that a non-null envelope sender address corresponds to the |
| 2480 | submission mode sender address. */ |
| 2481 | |
| 2482 | if (submission_mode && sender_address[0] != 0) |
| 2483 | { |
| 2484 | if (sender_address_unrewritten == NULL) |
| 2485 | sender_address_unrewritten = sender_address; |
| 2486 | sender_address = generated_sender_address; |
| 2487 | log_write(L_address_rewrite, LOG_MAIN, |
| 2488 | "\"%s\" from env-from rewritten as \"%s\" by submission mode", |
| 2489 | sender_address_unrewritten, generated_sender_address); |
| 2490 | } |
| 2491 | } |
| 2492 | |
| 2493 | |
| 2494 | /* If there are any rewriting rules, apply them to the sender address, unless |
| 2495 | it has already been rewritten as part of verification for SMTP input. */ |
| 2496 | |
| 2497 | if (global_rewrite_rules != NULL && sender_address_unrewritten == NULL && |
| 2498 | sender_address[0] != 0) |
| 2499 | { |
| 2500 | sender_address = rewrite_address(sender_address, FALSE, TRUE, |
| 2501 | global_rewrite_rules, rewrite_existflags); |
| 2502 | DEBUG(D_receive|D_rewrite) |
| 2503 | debug_printf("rewritten sender = %s\n", sender_address); |
| 2504 | } |
| 2505 | |
| 2506 | |
| 2507 | /* The headers must be run through rewrite_header(), because it ensures that |
| 2508 | addresses are fully qualified, as well as applying any rewriting rules that may |
| 2509 | exist. |
| 2510 | |
| 2511 | Qualification of header addresses in a message from a remote host happens only |
| 2512 | if the host is in sender_unqualified_hosts or recipient_unqualified hosts, as |
| 2513 | appropriate. For local messages, qualification always happens, unless -bnq is |
| 2514 | used to explicitly suppress it. No rewriting is done for an unqualified address |
| 2515 | that is left untouched. |
| 2516 | |
| 2517 | We start at the second header, skipping our own Received:. This rewriting is |
| 2518 | documented as happening *after* recipient addresses are taken from the headers |
| 2519 | by the -t command line option. An added Sender: gets rewritten here. */ |
| 2520 | |
| 2521 | for (h = header_list->next; h != NULL; h = h->next) |
| 2522 | { |
| 2523 | header_line *newh = rewrite_header(h, NULL, NULL, global_rewrite_rules, |
| 2524 | rewrite_existflags, TRUE); |
| 2525 | if (newh != NULL) h = newh; |
| 2526 | } |
| 2527 | |
| 2528 | |
| 2529 | /* An RFC 822 (sic) message is not legal unless it has at least one of "to", |
| 2530 | "cc", or "bcc". Note that although the minimal examples in RFC822 show just |
| 2531 | "to" or "bcc", the full syntax spec allows "cc" as well. If any resent- header |
| 2532 | exists, this applies to the set of resent- headers rather than the normal set. |
| 2533 | |
| 2534 | The requirement for a recipient header has been removed in RFC 2822. Earlier |
| 2535 | versions of Exim added a To: header for locally submitted messages, and an |
| 2536 | empty Bcc: header for others or when always_bcc was set. In the light of the |
| 2537 | changes in RFC 2822, we now always add Bcc: just in case there are still MTAs |
| 2538 | out there that insist on the RFC 822 syntax. |
| 2539 | |
| 2540 | November 2003: While generally revising what Exim does to fix up headers, it |
| 2541 | seems like a good time to remove this altogether. */ |
| 2542 | |
| 2543 | /****** |
| 2544 | if (!to_or_cc_header_exists && !bcc_header_exists) |
| 2545 | header_add(htype_bcc, "Bcc:\n"); |
| 2546 | ******/ |
| 2547 | |
| 2548 | /* If there is no date header, generate one if the message originates locally |
| 2549 | (i.e. not over TCP/IP) or the submission mode flag is set. Messages without |
| 2550 | Date: are not valid, but it seems to be more confusing if Exim adds one to |
| 2551 | all remotely-originated messages. */ |
| 2552 | |
| 2553 | if (!date_header_exists && (sender_host_address == NULL || submission_mode)) |
| 2554 | header_add(htype_other, "%sDate: %s\n", resent_prefix, tod_stamp(tod_full)); |
| 2555 | |
| 2556 | search_tidyup(); /* Free any cached resources */ |
| 2557 | |
| 2558 | /* Show the complete set of headers if debugging. Note that the first one (the |
| 2559 | new Received:) has not yet been set. */ |
| 2560 | |
| 2561 | DEBUG(D_receive) |
| 2562 | { |
| 2563 | debug_printf(">>Headers after rewriting and local additions:\n"); |
| 2564 | for (h = header_list->next; h != NULL; h = h->next) |
| 2565 | debug_printf("%c %s", h->type, h->text); |
| 2566 | debug_printf("\n"); |
| 2567 | } |
| 2568 | |
| 2569 | /* The headers are now complete in store. If we are running in filter |
| 2570 | testing mode, that is all this function does. Return TRUE if the message |
| 2571 | ended with a dot. */ |
| 2572 | |
| 2573 | if (filter_test != FTEST_NONE) |
| 2574 | { |
| 2575 | process_info[process_info_len] = 0; |
| 2576 | return message_ended == END_DOT; |
| 2577 | } |
| 2578 | |
| 2579 | /* Open a new spool file for the data portion of the message. We need |
| 2580 | to access it both via a file descriptor and a stream. Try to make the |
| 2581 | directory if it isn't there. Note re use of sprintf: spool_directory |
| 2582 | is checked on input to be < 200 characters long. */ |
| 2583 | |
| 2584 | sprintf(CS spool_name, "%s/input/%s/%s-D", spool_directory, message_subdir, |
| 2585 | message_id); |
| 2586 | data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE); |
| 2587 | if (data_fd < 0) |
| 2588 | { |
| 2589 | if (errno == ENOENT) |
| 2590 | { |
| 2591 | uschar temp[16]; |
| 2592 | sprintf(CS temp, "input/%s", message_subdir); |
| 2593 | if (message_subdir[0] == 0) temp[5] = 0; |
| 2594 | (void)directory_make(spool_directory, temp, INPUT_DIRECTORY_MODE, TRUE); |
| 2595 | data_fd = Uopen(spool_name, O_RDWR|O_CREAT|O_EXCL, SPOOL_MODE); |
| 2596 | } |
| 2597 | if (data_fd < 0) |
| 2598 | log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Failed to create spool file %s: %s", |
| 2599 | spool_name, strerror(errno)); |
| 2600 | } |
| 2601 | |
| 2602 | /* Make sure the file's group is the Exim gid, and double-check the mode |
| 2603 | because the group setting doesn't always get set automatically. */ |
| 2604 | |
| 2605 | (void)fchown(data_fd, exim_uid, exim_gid); |
| 2606 | (void)fchmod(data_fd, SPOOL_MODE); |
| 2607 | |
| 2608 | /* We now have data file open. Build a stream for it and lock it. We lock only |
| 2609 | the first line of the file (containing the message ID) because otherwise there |
| 2610 | are problems when Exim is run under Cygwin (I'm told). See comments in |
| 2611 | spool_in.c, where the same locking is done. */ |
| 2612 | |
| 2613 | data_file = fdopen(data_fd, "w+"); |
| 2614 | lock_data.l_type = F_WRLCK; |
| 2615 | lock_data.l_whence = SEEK_SET; |
| 2616 | lock_data.l_start = 0; |
| 2617 | lock_data.l_len = SPOOL_DATA_START_OFFSET; |
| 2618 | |
| 2619 | if (fcntl(data_fd, F_SETLK, &lock_data) < 0) |
| 2620 | log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Cannot lock %s (%d): %s", spool_name, |
| 2621 | errno, strerror(errno)); |
| 2622 | |
| 2623 | /* We have an open, locked data file. Write the message id to it to make it |
| 2624 | self-identifying. Then read the remainder of the input of this message and |
| 2625 | write it to the data file. If the variable next != NULL, it contains the first |
| 2626 | data line (which was read as a header but then turned out not to have the right |
| 2627 | format); write it (remembering that it might contain binary zeros). The result |
| 2628 | of fwrite() isn't inspected; instead we call ferror() below. */ |
| 2629 | |
| 2630 | fprintf(data_file, "%s-D\n", message_id); |
| 2631 | if (next != NULL) |
| 2632 | { |
| 2633 | uschar *s = next->text; |
| 2634 | int len = next->slen; |
| 2635 | (void)fwrite(s, 1, len, data_file); |
| 2636 | body_linecount++; /* Assumes only 1 line */ |
| 2637 | } |
| 2638 | |
| 2639 | /* Note that we might already be at end of file, or the logical end of file |
| 2640 | (indicated by '.'), or might have encountered an error while writing the |
| 2641 | message id or "next" line. */ |
| 2642 | |
| 2643 | if (!ferror(data_file) && !(receive_feof)() && message_ended != END_DOT) |
| 2644 | { |
| 2645 | if (smtp_input) |
| 2646 | { |
| 2647 | message_ended = read_message_data_smtp(data_file); |
| 2648 | receive_linecount++; /* The terminating "." line */ |
| 2649 | } |
| 2650 | else message_ended = read_message_data(data_file); |
| 2651 | |
| 2652 | receive_linecount += body_linecount; /* For BSMTP errors mainly */ |
| 2653 | message_linecount += body_linecount; |
| 2654 | |
| 2655 | /* Handle premature termination of SMTP */ |
| 2656 | |
| 2657 | if (smtp_input && message_ended == END_EOF) |
| 2658 | { |
| 2659 | Uunlink(spool_name); /* Lose data file when closed */ |
| 2660 | message_id[0] = 0; /* Indicate no message accepted */ |
| 2661 | smtp_reply = handle_lost_connection(US""); |
| 2662 | smtp_yield = FALSE; |
| 2663 | goto TIDYUP; /* Skip to end of function */ |
| 2664 | } |
| 2665 | |
| 2666 | /* Handle message that is too big. Don't use host_or_ident() in the log |
| 2667 | message; we want to see the ident value even for non-remote messages. */ |
| 2668 | |
| 2669 | if (message_ended == END_SIZE) |
| 2670 | { |
| 2671 | Uunlink(spool_name); /* Lose the data file when closed */ |
| 2672 | if (smtp_input) receive_swallow_smtp(); /* Swallow incoming SMTP */ |
| 2673 | |
| 2674 | log_write(L_size_reject, LOG_MAIN|LOG_REJECT, "rejected from <%s>%s%s%s%s: " |
| 2675 | "message too big: read=%d max=%d", |
| 2676 | sender_address, |
| 2677 | (sender_fullhost == NULL)? "" : " H=", |
| 2678 | (sender_fullhost == NULL)? US"" : sender_fullhost, |
| 2679 | (sender_ident == NULL)? "" : " U=", |
| 2680 | (sender_ident == NULL)? US"" : sender_ident, |
| 2681 | message_size, |
| 2682 | thismessage_size_limit); |
| 2683 | |
| 2684 | if (smtp_input) |
| 2685 | { |
| 2686 | smtp_reply = US"552 Message size exceeds maximum permitted"; |
| 2687 | message_id[0] = 0; /* Indicate no message accepted */ |
| 2688 | goto TIDYUP; /* Skip to end of function */ |
| 2689 | } |
| 2690 | else |
| 2691 | { |
| 2692 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 2693 | give_local_error(ERRMESS_TOOBIG, |
| 2694 | string_sprintf("message too big (max=%d)", thismessage_size_limit), |
| 2695 | US"message rejected: ", error_rc, data_file, header_list); |
| 2696 | /* Does not return */ |
| 2697 | } |
| 2698 | } |
| 2699 | } |
| 2700 | |
| 2701 | /* Restore the standard SIGALRM handler for any subsequent processing. (For |
| 2702 | example, there may be some expansion in an ACL that uses a timer.) */ |
| 2703 | |
| 2704 | os_non_restarting_signal(SIGALRM, sigalrm_handler); |
| 2705 | |
| 2706 | /* The message body has now been read into the data file. Call fflush() to |
| 2707 | empty the buffers in C, and then call fsync() to get the data written out onto |
| 2708 | the disk, as fflush() doesn't do this (or at least, it isn't documented as |
| 2709 | having to do this). If there was an I/O error on either input or output, |
| 2710 | attempt to send an error message, and unlink the spool file. For non-SMTP input |
| 2711 | we can then give up. Note that for SMTP input we must swallow the remainder of |
| 2712 | the input in cases of output errors, since the far end doesn't expect to see |
| 2713 | anything until the terminating dot line is sent. */ |
| 2714 | |
| 2715 | if (fflush(data_file) == EOF || ferror(data_file) || |
| 2716 | fsync(fileno(data_file)) < 0 || (receive_ferror)()) |
| 2717 | { |
| 2718 | uschar *msg_errno = US strerror(errno); |
| 2719 | BOOL input_error = (receive_ferror)() != 0; |
| 2720 | uschar *msg = string_sprintf("%s error (%s) while receiving message from %s", |
| 2721 | input_error? "Input read" : "Spool write", |
| 2722 | msg_errno, |
| 2723 | (sender_fullhost != NULL)? sender_fullhost : sender_ident); |
| 2724 | |
| 2725 | log_write(0, LOG_MAIN, "Message abandoned: %s", msg); |
| 2726 | Uunlink(spool_name); /* Lose the data file */ |
| 2727 | |
| 2728 | if (smtp_input) |
| 2729 | { |
| 2730 | if (input_error) |
| 2731 | smtp_reply = US"451 Error while reading input data"; |
| 2732 | else |
| 2733 | { |
| 2734 | smtp_reply = US"451 Error while writing spool file"; |
| 2735 | receive_swallow_smtp(); |
| 2736 | } |
| 2737 | message_id[0] = 0; /* Indicate no message accepted */ |
| 2738 | goto TIDYUP; /* Skip to end of function */ |
| 2739 | } |
| 2740 | |
| 2741 | else |
| 2742 | { |
| 2743 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 2744 | give_local_error(ERRMESS_IOERR, msg, US"", error_rc, data_file, |
| 2745 | header_list); |
| 2746 | /* Does not return */ |
| 2747 | } |
| 2748 | } |
| 2749 | |
| 2750 | |
| 2751 | /* No I/O errors were encountered while writing the data file. */ |
| 2752 | |
| 2753 | DEBUG(D_receive) debug_printf("Data file written for message %s\n", message_id); |
| 2754 | |
| 2755 | |
| 2756 | /* If there were any bad addresses extracted by -t, or there were no recipients |
| 2757 | left after -t, send a message to the sender of this message, or write it to |
| 2758 | stderr if the error handling option is set that way. Note that there may |
| 2759 | legitimately be no recipients for an SMTP message if they have all been removed |
| 2760 | by "discard". |
| 2761 | |
| 2762 | We need to rewind the data file in order to read it. In the case of no |
| 2763 | recipients or stderr error writing, throw the data file away afterwards, and |
| 2764 | exit. (This can't be SMTP, which always ensures there's at least one |
| 2765 | syntactically good recipient address.) */ |
| 2766 | |
| 2767 | if (extract_recip && (bad_addresses != NULL || recipients_count == 0)) |
| 2768 | { |
| 2769 | DEBUG(D_receive) |
| 2770 | { |
| 2771 | if (recipients_count == 0) debug_printf("*** No recipients\n"); |
| 2772 | if (bad_addresses != NULL) |
| 2773 | { |
| 2774 | error_block *eblock = bad_addresses; |
| 2775 | debug_printf("*** Bad address(es)\n"); |
| 2776 | while (eblock != NULL) |
| 2777 | { |
| 2778 | debug_printf(" %s: %s\n", eblock->text1, eblock->text2); |
| 2779 | eblock = eblock->next; |
| 2780 | } |
| 2781 | } |
| 2782 | } |
| 2783 | |
| 2784 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 2785 | |
| 2786 | /* If configured to send errors to the sender, but this fails, force |
| 2787 | a failure error code. We use a special one for no recipients so that it |
| 2788 | can be detected by the autoreply transport. Otherwise error_rc is set to |
| 2789 | errors_sender_rc, which is EXIT_FAILURE unless -oee was given, in which case |
| 2790 | it is EXIT_SUCCESS. */ |
| 2791 | |
| 2792 | if (error_handling == ERRORS_SENDER) |
| 2793 | { |
| 2794 | if (!moan_to_sender( |
| 2795 | (bad_addresses == NULL)? |
| 2796 | (extracted_ignored? ERRMESS_IGADDRESS : ERRMESS_NOADDRESS) : |
| 2797 | (recipients_list == NULL)? ERRMESS_BADNOADDRESS : ERRMESS_BADADDRESS, |
| 2798 | bad_addresses, header_list, data_file, FALSE)) |
| 2799 | error_rc = (bad_addresses == NULL)? EXIT_NORECIPIENTS : EXIT_FAILURE; |
| 2800 | } |
| 2801 | else |
| 2802 | { |
| 2803 | if (bad_addresses == NULL) |
| 2804 | { |
| 2805 | if (extracted_ignored) |
| 2806 | fprintf(stderr, "exim: all -t recipients overridden by command line\n"); |
| 2807 | else |
| 2808 | fprintf(stderr, "exim: no recipients in message\n"); |
| 2809 | } |
| 2810 | else |
| 2811 | { |
| 2812 | fprintf(stderr, "exim: invalid address%s", |
| 2813 | (bad_addresses->next == NULL)? ":" : "es:\n"); |
| 2814 | while (bad_addresses != NULL) |
| 2815 | { |
| 2816 | fprintf(stderr, " %s: %s\n", bad_addresses->text1, |
| 2817 | bad_addresses->text2); |
| 2818 | bad_addresses = bad_addresses->next; |
| 2819 | } |
| 2820 | } |
| 2821 | } |
| 2822 | |
| 2823 | if (recipients_count == 0 || error_handling == ERRORS_STDERR) |
| 2824 | { |
| 2825 | Uunlink(spool_name); |
| 2826 | (void)fclose(data_file); |
| 2827 | exim_exit(error_rc); |
| 2828 | } |
| 2829 | } |
| 2830 | |
| 2831 | /* Data file successfully written. Generate text for the Received: header by |
| 2832 | expanding the configured string, and adding a timestamp. By leaving this |
| 2833 | operation till now, we ensure that the timestamp is the time that message |
| 2834 | reception was completed. However, this is deliberately done before calling the |
| 2835 | data ACL and local_scan(). |
| 2836 | |
| 2837 | This Received: header may therefore be inspected by the data ACL and by code in |
| 2838 | the local_scan() function. When they have run, we update the timestamp to be |
| 2839 | the final time of reception. |
| 2840 | |
| 2841 | If there is just one recipient, set up its value in the $received_for variable |
| 2842 | for use when we generate the Received: header. |
| 2843 | |
| 2844 | Note: the checking for too many Received: headers is handled by the delivery |
| 2845 | code. */ |
| 2846 | |
| 2847 | timestamp = expand_string(US"${tod_full}"); |
| 2848 | if (recipients_count == 1) received_for = recipients_list[0].address; |
| 2849 | received = expand_string(received_header_text); |
| 2850 | received_for = NULL; |
| 2851 | |
| 2852 | if (received == NULL) |
| 2853 | { |
| 2854 | Uunlink(spool_name); /* Lose the data file */ |
| 2855 | log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Expansion of \"%s\" " |
| 2856 | "(received_header_text) failed: %s", string_printing(received_header_text), |
| 2857 | expand_string_message); |
| 2858 | } |
| 2859 | |
| 2860 | /* The first element on the header chain is reserved for the Received header, |
| 2861 | so all we have to do is fill in the text pointer, and set the type. However, if |
| 2862 | the result of the expansion is an empty string, we leave the header marked as |
| 2863 | "old" so as to refrain from adding a Received header. */ |
| 2864 | |
| 2865 | if (received[0] == 0) |
| 2866 | { |
| 2867 | received_header->text = string_sprintf("Received: ; %s\n", timestamp); |
| 2868 | received_header->type = htype_old; |
| 2869 | } |
| 2870 | else |
| 2871 | { |
| 2872 | received_header->text = string_sprintf("%s; %s\n", received, timestamp); |
| 2873 | received_header->type = htype_received; |
| 2874 | } |
| 2875 | |
| 2876 | received_header->slen = Ustrlen(received_header->text); |
| 2877 | |
| 2878 | DEBUG(D_receive) debug_printf(">>Generated Received: header line\n%c %s", |
| 2879 | received_header->type, received_header->text); |
| 2880 | |
| 2881 | /* Set the value of message_body_size for the DATA ACL and for local_scan() */ |
| 2882 | |
| 2883 | message_body_size = (fstat(data_fd, &statbuf) == 0)? |
| 2884 | statbuf.st_size - SPOOL_DATA_START_OFFSET : -1; |
| 2885 | |
| 2886 | /* If an ACL from any RCPT commands set up any warning headers to add, do so |
| 2887 | now, before running the DATA ACL. */ |
| 2888 | |
| 2889 | add_acl_headers(US"MAIL or RCPT"); |
| 2890 | |
| 2891 | /* If an ACL is specified for checking things at this stage of reception of a |
| 2892 | message, run it, unless all the recipients were removed by "discard" in earlier |
| 2893 | ACLs. That is the only case in which recipients_count can be zero at this |
| 2894 | stage. Set deliver_datafile to point to the data file so that $message_body and |
| 2895 | $message_body_end can be extracted if needed. Allow $recipients in expansions. |
| 2896 | */ |
| 2897 | |
| 2898 | deliver_datafile = data_fd; |
| 2899 | |
| 2900 | if (recipients_count == 0) |
| 2901 | { |
| 2902 | blackholed_by = recipients_discarded? US"MAIL ACL" : US"RCPT ACL"; |
| 2903 | } |
| 2904 | else |
| 2905 | { |
| 2906 | enable_dollar_recipients = TRUE; |
| 2907 | |
| 2908 | /* Handle interactive SMTP messages */ |
| 2909 | |
| 2910 | if (smtp_input && !smtp_batched_input) |
| 2911 | { |
| 2912 | |
| 2913 | #ifdef EXPERIMENTAL_DOMAINKEYS |
| 2914 | dk_exim_verify_finish(); |
| 2915 | #endif |
| 2916 | |
| 2917 | #ifdef WITH_CONTENT_SCAN |
| 2918 | if (acl_smtp_mime != NULL && |
| 2919 | !run_mime_acl(acl_smtp_mime, &smtp_yield, &smtp_reply, &blackholed_by)) |
| 2920 | goto TIDYUP; |
| 2921 | #endif /* WITH_CONTENT_SCAN */ |
| 2922 | |
| 2923 | /* Check the recipients count again, as the MIME ACL might have changed |
| 2924 | them. */ |
| 2925 | |
| 2926 | if (acl_smtp_data != NULL && recipients_count > 0) |
| 2927 | { |
| 2928 | uschar *user_msg, *log_msg; |
| 2929 | rc = acl_check(ACL_WHERE_DATA, NULL, acl_smtp_data, &user_msg, &log_msg); |
| 2930 | add_acl_headers(US"DATA"); |
| 2931 | if (rc == DISCARD) |
| 2932 | { |
| 2933 | recipients_count = 0; |
| 2934 | blackholed_by = US"DATA ACL"; |
| 2935 | if (log_msg != NULL) |
| 2936 | blackhole_log_msg = string_sprintf(": %s", log_msg); |
| 2937 | } |
| 2938 | else if (rc != OK) |
| 2939 | { |
| 2940 | Uunlink(spool_name); |
| 2941 | #ifdef WITH_CONTENT_SCAN |
| 2942 | unspool_mbox(); |
| 2943 | #endif |
| 2944 | if (smtp_handle_acl_fail(ACL_WHERE_DATA, rc, user_msg, log_msg) != 0) |
| 2945 | smtp_yield = FALSE; /* No more messsages after dropped connection */ |
| 2946 | smtp_reply = US""; /* Indicate reply already sent */ |
| 2947 | message_id[0] = 0; /* Indicate no message accepted */ |
| 2948 | goto TIDYUP; /* Skip to end of function */ |
| 2949 | } |
| 2950 | } |
| 2951 | } |
| 2952 | |
| 2953 | /* Handle non-SMTP and batch SMTP (i.e. non-interactive) messages. Note that |
| 2954 | we cannot take different actions for permanent and temporary rejections. */ |
| 2955 | |
| 2956 | else |
| 2957 | { |
| 2958 | |
| 2959 | #ifdef WITH_CONTENT_SCAN |
| 2960 | if (acl_not_smtp_mime != NULL && |
| 2961 | !run_mime_acl(acl_not_smtp_mime, &smtp_yield, &smtp_reply, |
| 2962 | &blackholed_by)) |
| 2963 | goto TIDYUP; |
| 2964 | #endif /* WITH_CONTENT_SCAN */ |
| 2965 | |
| 2966 | if (acl_not_smtp != NULL) |
| 2967 | { |
| 2968 | uschar *user_msg, *log_msg; |
| 2969 | rc = acl_check(ACL_WHERE_NOTSMTP, NULL, acl_not_smtp, &user_msg, &log_msg); |
| 2970 | if (rc == DISCARD) |
| 2971 | { |
| 2972 | recipients_count = 0; |
| 2973 | blackholed_by = US"non-SMTP ACL"; |
| 2974 | if (log_msg != NULL) |
| 2975 | blackhole_log_msg = string_sprintf(": %s", log_msg); |
| 2976 | } |
| 2977 | else if (rc != OK) |
| 2978 | { |
| 2979 | Uunlink(spool_name); |
| 2980 | #ifdef WITH_CONTENT_SCAN |
| 2981 | unspool_mbox(); |
| 2982 | #endif |
| 2983 | log_write(0, LOG_MAIN|LOG_REJECT, "F=<%s> rejected by non-SMTP ACL: %s", |
| 2984 | sender_address, log_msg); |
| 2985 | if (user_msg == NULL) user_msg = US"local configuration problem"; |
| 2986 | if (smtp_batched_input) |
| 2987 | { |
| 2988 | moan_smtp_batch(NULL, "%d %s", 550, user_msg); |
| 2989 | /* Does not return */ |
| 2990 | } |
| 2991 | else |
| 2992 | { |
| 2993 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 2994 | give_local_error(ERRMESS_LOCAL_ACL, user_msg, |
| 2995 | US"message rejected by non-SMTP ACL: ", error_rc, data_file, |
| 2996 | header_list); |
| 2997 | /* Does not return */ |
| 2998 | } |
| 2999 | } |
| 3000 | add_acl_headers(US"non-SMTP"); |
| 3001 | } |
| 3002 | } |
| 3003 | |
| 3004 | /* The applicable ACLs have been run */ |
| 3005 | |
| 3006 | if (deliver_freeze) frozen_by = US"ACL"; /* for later logging */ |
| 3007 | if (queue_only_policy) queued_by = US"ACL"; |
| 3008 | |
| 3009 | enable_dollar_recipients = FALSE; |
| 3010 | } |
| 3011 | |
| 3012 | #ifdef WITH_CONTENT_SCAN |
| 3013 | unspool_mbox(); |
| 3014 | #endif |
| 3015 | |
| 3016 | /* The final check on the message is to run the scan_local() function. The |
| 3017 | version supplied with Exim always accepts, but this is a hook for sysadmins to |
| 3018 | supply their own checking code. The local_scan() function is run even when all |
| 3019 | the recipients have been discarded. */ |
| 3020 | |
| 3021 | lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 3022 | |
| 3023 | /* Arrange to catch crashes in local_scan(), so that the -D file gets |
| 3024 | deleted, and the incident gets logged. */ |
| 3025 | |
| 3026 | os_non_restarting_signal(SIGSEGV, local_scan_crash_handler); |
| 3027 | os_non_restarting_signal(SIGFPE, local_scan_crash_handler); |
| 3028 | os_non_restarting_signal(SIGILL, local_scan_crash_handler); |
| 3029 | os_non_restarting_signal(SIGBUS, local_scan_crash_handler); |
| 3030 | |
| 3031 | DEBUG(D_receive) debug_printf("calling local_scan(); timeout=%d\n", |
| 3032 | local_scan_timeout); |
| 3033 | local_scan_data = NULL; |
| 3034 | |
| 3035 | os_non_restarting_signal(SIGALRM, local_scan_timeout_handler); |
| 3036 | if (local_scan_timeout > 0) alarm(local_scan_timeout); |
| 3037 | rc = local_scan(data_fd, &local_scan_data); |
| 3038 | alarm(0); |
| 3039 | os_non_restarting_signal(SIGALRM, sigalrm_handler); |
| 3040 | |
| 3041 | store_pool = POOL_MAIN; /* In case changed */ |
| 3042 | DEBUG(D_receive) debug_printf("local_scan() returned %d %s\n", rc, |
| 3043 | local_scan_data); |
| 3044 | |
| 3045 | os_non_restarting_signal(SIGSEGV, SIG_DFL); |
| 3046 | os_non_restarting_signal(SIGFPE, SIG_DFL); |
| 3047 | os_non_restarting_signal(SIGILL, SIG_DFL); |
| 3048 | os_non_restarting_signal(SIGBUS, SIG_DFL); |
| 3049 | |
| 3050 | /* The length check is paranoia against some runaway code, and also because |
| 3051 | (for a success return) lines in the spool file are read into big_buffer. */ |
| 3052 | |
| 3053 | if (local_scan_data != NULL) |
| 3054 | { |
| 3055 | int len = Ustrlen(local_scan_data); |
| 3056 | if (len > LOCAL_SCAN_MAX_RETURN) len = LOCAL_SCAN_MAX_RETURN; |
| 3057 | local_scan_data = string_copyn(local_scan_data, len); |
| 3058 | } |
| 3059 | |
| 3060 | if (rc == LOCAL_SCAN_ACCEPT_FREEZE) |
| 3061 | { |
| 3062 | if (!deliver_freeze) /* ACL might have already frozen */ |
| 3063 | { |
| 3064 | deliver_freeze = TRUE; |
| 3065 | deliver_frozen_at = time(NULL); |
| 3066 | frozen_by = US"local_scan()"; |
| 3067 | } |
| 3068 | rc = LOCAL_SCAN_ACCEPT; |
| 3069 | } |
| 3070 | else if (rc == LOCAL_SCAN_ACCEPT_QUEUE) |
| 3071 | { |
| 3072 | if (!queue_only_policy) /* ACL might have already queued */ |
| 3073 | { |
| 3074 | queue_only_policy = TRUE; |
| 3075 | queued_by = US"local_scan()"; |
| 3076 | } |
| 3077 | rc = LOCAL_SCAN_ACCEPT; |
| 3078 | } |
| 3079 | |
| 3080 | /* Message accepted: remove newlines in local_scan_data because otherwise |
| 3081 | the spool file gets corrupted. Ensure that all recipients are qualified. */ |
| 3082 | |
| 3083 | if (rc == LOCAL_SCAN_ACCEPT) |
| 3084 | { |
| 3085 | if (local_scan_data != NULL) |
| 3086 | { |
| 3087 | uschar *s; |
| 3088 | for (s = local_scan_data; *s != 0; s++) if (*s == '\n') *s = ' '; |
| 3089 | } |
| 3090 | for (i = 0; i < recipients_count; i++) |
| 3091 | { |
| 3092 | recipient_item *r = recipients_list + i; |
| 3093 | r->address = rewrite_address_qualify(r->address, TRUE); |
| 3094 | if (r->errors_to != NULL) |
| 3095 | r->errors_to = rewrite_address_qualify(r->errors_to, TRUE); |
| 3096 | } |
| 3097 | if (recipients_count == 0 && blackholed_by == NULL) |
| 3098 | blackholed_by = US"local_scan"; |
| 3099 | } |
| 3100 | |
| 3101 | /* Message rejected: newlines permitted in local_scan_data to generate |
| 3102 | multiline SMTP responses. */ |
| 3103 | |
| 3104 | else |
| 3105 | { |
| 3106 | uschar *istemp = US""; |
| 3107 | uschar *s = NULL; |
| 3108 | int size = 0; |
| 3109 | int sptr = 0; |
| 3110 | int code; |
| 3111 | |
| 3112 | errmsg = local_scan_data; |
| 3113 | |
| 3114 | Uunlink(spool_name); /* Cancel this message */ |
| 3115 | switch(rc) |
| 3116 | { |
| 3117 | default: |
| 3118 | log_write(0, LOG_MAIN, "invalid return %d from local_scan(). Temporary " |
| 3119 | "rejection given", rc); |
| 3120 | goto TEMPREJECT; |
| 3121 | |
| 3122 | case LOCAL_SCAN_REJECT_NOLOGHDR: |
| 3123 | log_extra_selector &= ~LX_rejected_header; |
| 3124 | /* Fall through */ |
| 3125 | |
| 3126 | case LOCAL_SCAN_REJECT: |
| 3127 | code = 550; |
| 3128 | if (errmsg == NULL) errmsg = US"Administrative prohibition"; |
| 3129 | break; |
| 3130 | |
| 3131 | case LOCAL_SCAN_TEMPREJECT_NOLOGHDR: |
| 3132 | log_extra_selector &= ~LX_rejected_header; |
| 3133 | /* Fall through */ |
| 3134 | |
| 3135 | case LOCAL_SCAN_TEMPREJECT: |
| 3136 | TEMPREJECT: |
| 3137 | code = 451; |
| 3138 | if (errmsg == NULL) errmsg = US"Temporary local problem"; |
| 3139 | istemp = US"temporarily "; |
| 3140 | break; |
| 3141 | } |
| 3142 | |
| 3143 | s = string_append(s, &size, &sptr, 2, US"F=", |
| 3144 | (sender_address[0] == 0)? US"<>" : sender_address); |
| 3145 | s = add_host_info_for_log(s, &size, &sptr); |
| 3146 | s[sptr] = 0; |
| 3147 | |
| 3148 | log_write(0, LOG_MAIN|LOG_REJECT, "%s %srejected by local_scan(): %.256s", |
| 3149 | s, istemp, string_printing(errmsg)); |
| 3150 | |
| 3151 | if (smtp_input) |
| 3152 | { |
| 3153 | if (!smtp_batched_input) |
| 3154 | { |
| 3155 | smtp_respond(code, TRUE, errmsg); |
| 3156 | message_id[0] = 0; /* Indicate no message accepted */ |
| 3157 | smtp_reply = US""; /* Indicate reply already sent */ |
| 3158 | goto TIDYUP; /* Skip to end of function */ |
| 3159 | } |
| 3160 | else |
| 3161 | { |
| 3162 | moan_smtp_batch(NULL, "%d %s", code, errmsg); |
| 3163 | /* Does not return */ |
| 3164 | } |
| 3165 | } |
| 3166 | else |
| 3167 | { |
| 3168 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 3169 | give_local_error(ERRMESS_LOCAL_SCAN, errmsg, |
| 3170 | US"message rejected by local scan code: ", error_rc, data_file, |
| 3171 | header_list); |
| 3172 | /* Does not return */ |
| 3173 | } |
| 3174 | } |
| 3175 | |
| 3176 | /* Reset signal handlers to ignore signals that previously would have caused |
| 3177 | the message to be abandoned. */ |
| 3178 | |
| 3179 | signal(SIGTERM, SIG_IGN); |
| 3180 | signal(SIGINT, SIG_IGN); |
| 3181 | |
| 3182 | /* Ensure the first time flag is set in the newly-received message. */ |
| 3183 | |
| 3184 | deliver_firsttime = TRUE; |
| 3185 | |
| 3186 | #ifdef EXPERIMENTAL_BRIGHTMAIL |
| 3187 | if (bmi_run == 1) { |
| 3188 | /* rewind data file */ |
| 3189 | lseek(data_fd, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 3190 | bmi_verdicts = bmi_process_message(header_list, data_fd); |
| 3191 | }; |
| 3192 | #endif |
| 3193 | |
| 3194 | /* Update the timstamp in our Received: header to account for any time taken by |
| 3195 | an ACL or by local_scan(). The new time is the time that all reception |
| 3196 | processing is complete. */ |
| 3197 | |
| 3198 | timestamp = expand_string(US"${tod_full}"); |
| 3199 | tslen = Ustrlen(timestamp); |
| 3200 | |
| 3201 | memcpy(received_header->text + received_header->slen - tslen - 1, |
| 3202 | timestamp, tslen); |
| 3203 | |
| 3204 | /* In MUA wrapper mode, ignore queueing actions set by ACL or local_scan() */ |
| 3205 | |
| 3206 | if (mua_wrapper) |
| 3207 | { |
| 3208 | deliver_freeze = FALSE; |
| 3209 | queue_only_policy = FALSE; |
| 3210 | } |
| 3211 | |
| 3212 | /* Keep the data file open until we have written the header file, in order to |
| 3213 | hold onto the lock. In a -bh run, or if the message is to be blackholed, we |
| 3214 | don't write the header file, and we unlink the data file. If writing the header |
| 3215 | file fails, we have failed to accept this message. */ |
| 3216 | |
| 3217 | if (host_checking || blackholed_by != NULL) |
| 3218 | { |
| 3219 | header_line *h; |
| 3220 | Uunlink(spool_name); |
| 3221 | msg_size = 0; /* Compute size for log line */ |
| 3222 | for (h = header_list; h != NULL; h = h->next) |
| 3223 | if (h->type != '*') msg_size += h->slen; |
| 3224 | } |
| 3225 | |
| 3226 | /* Write the -H file */ |
| 3227 | |
| 3228 | else |
| 3229 | { |
| 3230 | if ((msg_size = spool_write_header(message_id, SW_RECEIVING, &errmsg)) < 0) |
| 3231 | { |
| 3232 | log_write(0, LOG_MAIN, "Message abandoned: %s", errmsg); |
| 3233 | Uunlink(spool_name); /* Lose the data file */ |
| 3234 | |
| 3235 | if (smtp_input) |
| 3236 | { |
| 3237 | smtp_reply = US"451 Error in writing spool file"; |
| 3238 | message_id[0] = 0; /* Indicate no message accepted */ |
| 3239 | goto TIDYUP; |
| 3240 | } |
| 3241 | else |
| 3242 | { |
| 3243 | fseek(data_file, (long int)SPOOL_DATA_START_OFFSET, SEEK_SET); |
| 3244 | give_local_error(ERRMESS_IOERR, errmsg, US"", error_rc, data_file, |
| 3245 | header_list); |
| 3246 | /* Does not return */ |
| 3247 | } |
| 3248 | } |
| 3249 | } |
| 3250 | |
| 3251 | |
| 3252 | /* The message has now been successfully received. */ |
| 3253 | |
| 3254 | receive_messagecount++; |
| 3255 | |
| 3256 | /* In SMTP sessions we may receive several in one connection. After each one, |
| 3257 | we wait for the clock to tick at the level of message-id granularity. This is |
| 3258 | so that the combination of time+pid is unique, even on systems where the pid |
| 3259 | can be re-used within our time interval. We can't shorten the interval without |
| 3260 | re-designing the message-id. See comments above where the message id is |
| 3261 | created. This is Something For The Future. */ |
| 3262 | |
| 3263 | message_id_tv.tv_usec = (message_id_tv.tv_usec/id_resolution) * id_resolution; |
| 3264 | exim_wait_tick(&message_id_tv, id_resolution); |
| 3265 | |
| 3266 | /* Add data size to written header size. We do not count the initial file name |
| 3267 | that is in the file, but we do add one extra for the notional blank line that |
| 3268 | precedes the data. This total differs from message_size in that it include the |
| 3269 | added Received: header and any other headers that got created locally. */ |
| 3270 | |
| 3271 | fflush(data_file); |
| 3272 | fstat(data_fd, &statbuf); |
| 3273 | |
| 3274 | msg_size += statbuf.st_size - SPOOL_DATA_START_OFFSET + 1; |
| 3275 | |
| 3276 | /* Generate a "message received" log entry. We do this by building up a dynamic |
| 3277 | string as required. Since we commonly want to add two items at a time, use a |
| 3278 | macro to simplify the coding. We log the arrival of a new message while the |
| 3279 | file is still locked, just in case the machine is *really* fast, and delivers |
| 3280 | it first! Include any message id that is in the message - since the syntax of a |
| 3281 | message id is actually an addr-spec, we can use the parse routine to canonicize |
| 3282 | it. */ |
| 3283 | |
| 3284 | size = 256; |
| 3285 | sptr = 0; |
| 3286 | s = store_get(size); |
| 3287 | |
| 3288 | s = string_append(s, &size, &sptr, 2, US"<= ", |
| 3289 | (sender_address[0] == 0)? US"<>" : sender_address); |
| 3290 | if (message_reference != NULL) |
| 3291 | s = string_append(s, &size, &sptr, 2, US" R=", message_reference); |
| 3292 | |
| 3293 | s = add_host_info_for_log(s, &size, &sptr); |
| 3294 | |
| 3295 | #ifdef SUPPORT_TLS |
| 3296 | if ((log_extra_selector & LX_tls_cipher) != 0 && tls_cipher != NULL) |
| 3297 | s = string_append(s, &size, &sptr, 2, US" X=", tls_cipher); |
| 3298 | if ((log_extra_selector & LX_tls_certificate_verified) != 0 && |
| 3299 | tls_cipher != NULL) |
| 3300 | s = string_append(s, &size, &sptr, 2, US" CV=", |
| 3301 | tls_certificate_verified? "yes":"no"); |
| 3302 | if ((log_extra_selector & LX_tls_peerdn) != 0 && tls_peerdn != NULL) |
| 3303 | s = string_append(s, &size, &sptr, 3, US" DN=\"", tls_peerdn, US"\""); |
| 3304 | #endif |
| 3305 | |
| 3306 | if (sender_host_authenticated != NULL) |
| 3307 | { |
| 3308 | s = string_append(s, &size, &sptr, 2, US" A=", sender_host_authenticated); |
| 3309 | if (authenticated_id != NULL) |
| 3310 | s = string_append(s, &size, &sptr, 2, US":", authenticated_id); |
| 3311 | } |
| 3312 | |
| 3313 | sprintf(CS big_buffer, "%d", msg_size); |
| 3314 | s = string_append(s, &size, &sptr, 2, US" S=", big_buffer); |
| 3315 | |
| 3316 | /* If an addr-spec in a message-id contains a quoted string, it can contain |
| 3317 | any characters except " \ and CR and so in particular it can contain NL! |
| 3318 | Therefore, make sure we use a printing-characters only version for the log. |
| 3319 | Also, allow for domain literals in the message id. */ |
| 3320 | |
| 3321 | if (msgid_header != NULL) |
| 3322 | { |
| 3323 | uschar *old_id; |
| 3324 | BOOL save_allow_domain_literals = allow_domain_literals; |
| 3325 | allow_domain_literals = TRUE; |
| 3326 | old_id = parse_extract_address(Ustrchr(msgid_header->text, ':') + 1, |
| 3327 | &errmsg, &start, &end, &domain, FALSE); |
| 3328 | allow_domain_literals = save_allow_domain_literals; |
| 3329 | if (old_id != NULL) |
| 3330 | s = string_append(s, &size, &sptr, 2, US" id=", string_printing(old_id)); |
| 3331 | } |
| 3332 | |
| 3333 | /* If subject logging is turned on, create suitable printing-character |
| 3334 | text. By expanding $h_subject: we make use of the MIME decoding. */ |
| 3335 | |
| 3336 | if ((log_extra_selector & LX_subject) != 0 && subject_header != NULL) |
| 3337 | { |
| 3338 | int i; |
| 3339 | uschar *p = big_buffer; |
| 3340 | uschar *ss = expand_string(US"$h_subject:"); |
| 3341 | |
| 3342 | /* Backslash-quote any double quotes or backslashes so as to make a |
| 3343 | a C-like string, and turn any non-printers into escape sequences. */ |
| 3344 | |
| 3345 | *p++ = '\"'; |
| 3346 | if (*ss != 0) for (i = 0; i < 100 && ss[i] != 0; i++) |
| 3347 | { |
| 3348 | if (ss[i] == '\"' || ss[i] == '\\') *p++ = '\\'; |
| 3349 | *p++ = ss[i]; |
| 3350 | } |
| 3351 | *p++ = '\"'; |
| 3352 | *p = 0; |
| 3353 | s = string_append(s, &size, &sptr, 2, US" T=", string_printing(big_buffer)); |
| 3354 | } |
| 3355 | |
| 3356 | /* Terminate the string: string_cat() and string_append() leave room, but do |
| 3357 | not put the zero in. */ |
| 3358 | |
| 3359 | s[sptr] = 0; |
| 3360 | |
| 3361 | /* While writing to the log, set a flag to cause a call to receive_bomb_out() |
| 3362 | if the log cannot be opened. */ |
| 3363 | |
| 3364 | receive_call_bombout = TRUE; |
| 3365 | log_write(0, LOG_MAIN | |
| 3366 | (((log_extra_selector & LX_received_recipients) != 0)? LOG_RECIPIENTS : 0) | |
| 3367 | (((log_extra_selector & LX_received_sender) != 0)? LOG_SENDER : 0), |
| 3368 | "%s", s); |
| 3369 | receive_call_bombout = FALSE; |
| 3370 | |
| 3371 | /* Log any control actions taken by an ACL or local_scan(). */ |
| 3372 | |
| 3373 | if (deliver_freeze) log_write(0, LOG_MAIN, "frozen by %s", frozen_by); |
| 3374 | if (queue_only_policy) log_write(L_delay_delivery, LOG_MAIN, |
| 3375 | "no immediate delivery: queued by %s", queued_by); |
| 3376 | |
| 3377 | /* Create a message log file if message logs are being used and this message is |
| 3378 | not blackholed. Write the reception stuff to it. We used to leave message log |
| 3379 | creation until the first delivery, but this has proved confusing for somep |
| 3380 | people. */ |
| 3381 | |
| 3382 | if (message_logs && blackholed_by == NULL) |
| 3383 | { |
| 3384 | int fd; |
| 3385 | |
| 3386 | sprintf(CS spool_name, "%s/msglog/%s/%s", spool_directory, message_subdir, |
| 3387 | message_id); |
| 3388 | fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE); |
| 3389 | |
| 3390 | if (fd < 0 && errno == ENOENT) |
| 3391 | { |
| 3392 | uschar temp[16]; |
| 3393 | sprintf(CS temp, "msglog/%s", message_subdir); |
| 3394 | if (message_subdir[0] == 0) temp[6] = 0; |
| 3395 | (void)directory_make(spool_directory, temp, MSGLOG_DIRECTORY_MODE, TRUE); |
| 3396 | fd = Uopen(spool_name, O_WRONLY|O_APPEND|O_CREAT, SPOOL_MODE); |
| 3397 | } |
| 3398 | |
| 3399 | if (fd < 0) |
| 3400 | { |
| 3401 | log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't open message log %s: %s", |
| 3402 | spool_name, strerror(errno)); |
| 3403 | } |
| 3404 | |
| 3405 | else |
| 3406 | { |
| 3407 | FILE *message_log = fdopen(fd, "a"); |
| 3408 | if (message_log == NULL) |
| 3409 | { |
| 3410 | log_write(0, LOG_MAIN|LOG_PANIC, "Couldn't fdopen message log %s: %s", |
| 3411 | spool_name, strerror(errno)); |
| 3412 | (void)close(fd); |
| 3413 | } |
| 3414 | else |
| 3415 | { |
| 3416 | uschar *now = tod_stamp(tod_log); |
| 3417 | fprintf(message_log, "%s Received from %s\n", now, s+3); |
| 3418 | if (deliver_freeze) fprintf(message_log, "%s frozen by %s\n", now, |
| 3419 | frozen_by); |
| 3420 | if (queue_only_policy) fprintf(message_log, |
| 3421 | "%s no immediate delivery: queued by %s\n", now, queued_by); |
| 3422 | (void)fclose(message_log); |
| 3423 | } |
| 3424 | } |
| 3425 | } |
| 3426 | |
| 3427 | store_reset(s); /* The store for the main log message can be reused */ |
| 3428 | |
| 3429 | /* If the message is frozen, and freeze_tell is set, do the telling. */ |
| 3430 | |
| 3431 | if (deliver_freeze && freeze_tell != NULL && freeze_tell[0] != 0) |
| 3432 | { |
| 3433 | moan_tell_someone(freeze_tell, NULL, US"Message frozen on arrival", |
| 3434 | "Message %s was frozen on arrival by %s.\nThe sender is <%s>.\n", |
| 3435 | message_id, frozen_by, sender_address); |
| 3436 | } |
| 3437 | |
| 3438 | |
| 3439 | /* Either a message has been successfully received and written to the two spool |
| 3440 | files, or an error in writing the spool has occurred for an SMTP message, or |
| 3441 | an SMTP message has been rejected because of a bad sender. (For a non-SMTP |
| 3442 | message we will have already given up because there's no point in carrying on!) |
| 3443 | In either event, we must now close (and thereby unlock) the data file. In the |
| 3444 | successful case, this leaves the message on the spool, ready for delivery. In |
| 3445 | the error case, the spool file will be deleted. Then tidy up store, interact |
| 3446 | with an SMTP call if necessary, and return. |
| 3447 | |
| 3448 | A fflush() was done earlier in the expectation that any write errors on the |
| 3449 | data file will be flushed(!) out thereby. Nevertheless, it is theoretically |
| 3450 | possible for fclose() to fail - but what to do? What has happened to the lock |
| 3451 | if this happens? */ |
| 3452 | |
| 3453 | TIDYUP: |
| 3454 | process_info[process_info_len] = 0; /* Remove message id */ |
| 3455 | if (data_file != NULL) (void)fclose(data_file); /* Frees the lock */ |
| 3456 | |
| 3457 | /* Now reset signal handlers to their defaults */ |
| 3458 | |
| 3459 | signal(SIGTERM, SIG_DFL); |
| 3460 | signal(SIGINT, SIG_DFL); |
| 3461 | |
| 3462 | /* Tell an SMTP caller the state of play, and arrange to return the SMTP return |
| 3463 | value, which defaults TRUE - meaning there may be more incoming messages from |
| 3464 | this connection. For non-SMTP callers (where there is only ever one message), |
| 3465 | the default is FALSE. */ |
| 3466 | |
| 3467 | if (smtp_input) |
| 3468 | { |
| 3469 | yield = smtp_yield; |
| 3470 | |
| 3471 | /* Handle interactive SMTP callers. After several kinds of error, smtp_reply |
| 3472 | is set to the response. However, after an ACL error or local_scan() error, |
| 3473 | the response has already been sent, and smtp_reply is an empty string to |
| 3474 | indicate this. */ |
| 3475 | |
| 3476 | if (!smtp_batched_input) |
| 3477 | { |
| 3478 | if (smtp_reply == NULL) |
| 3479 | { |
| 3480 | if (fake_response != OK) |
| 3481 | smtp_respond(fake_response == DEFER ? 450 : 550, |
| 3482 | TRUE, fake_response_text); |
| 3483 | else |
| 3484 | smtp_printf("250 OK id=%s\r\n", message_id); |
| 3485 | if (host_checking) |
| 3486 | fprintf(stdout, |
| 3487 | "\n**** SMTP testing: that is not a real message id!\n\n"); |
| 3488 | } |
| 3489 | else if (smtp_reply[0] != 0) |
| 3490 | { |
| 3491 | if (fake_response != OK && (smtp_reply[0] == '2')) |
| 3492 | smtp_respond(fake_response == DEFER ? 450 : 550, |
| 3493 | TRUE, fake_response_text); |
| 3494 | else |
| 3495 | smtp_printf("%.1024s\r\n", smtp_reply); |
| 3496 | } |
| 3497 | } |
| 3498 | |
| 3499 | /* For batched SMTP, generate an error message on failure, and do |
| 3500 | nothing on success. The function moan_smtp_batch() does not return - |
| 3501 | it exits from the program with a non-zero return code. */ |
| 3502 | |
| 3503 | else if (smtp_reply != NULL) moan_smtp_batch(NULL, "%s", smtp_reply); |
| 3504 | } |
| 3505 | |
| 3506 | |
| 3507 | /* If blackholing, we can immediately log this message's sad fate. The data |
| 3508 | file has already been unlinked, and the header file was never written to disk. |
| 3509 | We must now indicate that nothing was received, to prevent a delivery from |
| 3510 | starting. */ |
| 3511 | |
| 3512 | if (blackholed_by != NULL) |
| 3513 | { |
| 3514 | uschar *detail = (local_scan_data != NULL)? |
| 3515 | string_printing(local_scan_data) : |
| 3516 | string_sprintf("(%s discarded recipients)", blackholed_by); |
| 3517 | log_write(0, LOG_MAIN, "=> blackhole %s%s", detail, blackhole_log_msg); |
| 3518 | log_write(0, LOG_MAIN, "Completed"); |
| 3519 | message_id[0] = 0; |
| 3520 | } |
| 3521 | |
| 3522 | /* Reset headers so that logging of rejects for a subsequent message doesn't |
| 3523 | include them. It is also important to set header_last = NULL before exiting |
| 3524 | from this function, as this prevents certain rewrites that might happen during |
| 3525 | subsequent verifying (of another incoming message) from trying to add headers |
| 3526 | when they shouldn't. */ |
| 3527 | |
| 3528 | header_list = header_last = NULL; |
| 3529 | |
| 3530 | return yield; /* TRUE if more messages (SMTP only) */ |
| 3531 | } |
| 3532 | |
| 3533 | /* End of receive.c */ |