Testsuite: remove old testcase for reverse_host_lookup/defer_ok
[exim.git] / src / src / spam.c
CommitLineData
8523533c
TK
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
5/* Copyright (c) Tom Kistner <tom@duncanthrax.net> 2003-???? */
6/* License: GPL */
7
8/* Code for calling spamassassin's spamd. Called from acl.c. */
9
10#include "exim.h"
11#ifdef WITH_CONTENT_SCAN
12#include "spam.h"
13
14uschar spam_score_buffer[16];
15uschar spam_score_int_buffer[16];
16uschar spam_bar_buffer[128];
17uschar spam_report_buffer[32600];
18uschar prev_user_name[128] = "";
19int spam_ok = 0;
20int spam_rc = 0;
f7274286 21uschar *prev_spamd_address_work = NULL;
8523533c 22
c007c974
JH
23int
24spam(uschar **listptr)
25{
8523533c
TK
26 int sep = 0;
27 uschar *list = *listptr;
28 uschar *user_name;
29 uschar user_name_buffer[128];
f7b63901 30 unsigned long mbox_size;
8523533c 31 FILE *mbox_file;
0f501486 32 int spamd_sock = -1;
8523533c 33 uschar spamd_buffer[32600];
cfe75fc3 34 int i, j, offset, result;
8523533c
TK
35 uschar spamd_version[8];
36 uschar spamd_score_char;
37 double spamd_threshold, spamd_score;
38 int spamd_report_offset;
39 uschar *p,*q;
40 int override = 0;
cfe75fc3
PH
41 time_t start;
42 size_t read, wrote;
8523533c 43 struct sockaddr_un server;
f452e07e 44#ifndef NO_POLL_H
cfe75fc3 45 struct pollfd pollfd;
25257489
PH
46#else /* Patch posted by Erik ? for OS X */
47 struct timeval select_tv; /* and applied by PH */
48 fd_set select_fd;
f452e07e 49#endif
b6e6e716 50 uschar *spamd_address_work;
b6fbf22d 51 static const uschar * loglabel = US"spam acl condition:";
8523533c 52
5614ee86 53 /* stop compiler warning */
91ecef39 54 result = 0;
5614ee86 55
8523533c
TK
56 /* find the username from the option list */
57 if ((user_name = string_nextinlist(&list, &sep,
58 user_name_buffer,
ddcf2b5f
JH
59 sizeof(user_name_buffer))) == NULL)
60 {
8523533c
TK
61 /* no username given, this means no scanning should be done */
62 return FAIL;
ddcf2b5f 63 }
8523533c
TK
64
65 /* if username is "0" or "false", do not scan */
66 if ( (Ustrcmp(user_name,"0") == 0) ||
ddcf2b5f 67 (strcmpic(user_name,US"false") == 0) )
8523533c 68 return FAIL;
8523533c
TK
69
70 /* if there is an additional option, check if it is "true" */
ddcf2b5f 71 if (strcmpic(list,US"true") == 0)
8523533c
TK
72 /* in that case, always return true later */
73 override = 1;
8523533c 74
f7274286 75 /* expand spamd_address if needed */
ddcf2b5f
JH
76 if (*spamd_address == '$')
77 {
f7274286 78 spamd_address_work = expand_string(spamd_address);
ddcf2b5f
JH
79 if (spamd_address_work == NULL)
80 {
f7274286 81 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8
JH
82 "%s spamd_address starts with $, but expansion failed: %s",
83 loglabel, expand_string_message);
f7274286 84 return DEFER;
ddcf2b5f 85 }
f7274286 86 }
f7274286
PP
87 else
88 spamd_address_work = spamd_address;
89
90 /* check if previous spamd_address was expanded and has changed. dump cached results if so */
ddcf2b5f
JH
91 if ( spam_ok
92 && prev_spamd_address_work != NULL
93 && Ustrcmp(prev_spamd_address_work, spamd_address_work) != 0
94 )
f7274286 95 spam_ok = 0;
f7274286 96
8e669ac1 97 /* if we scanned for this username last time, just return */
e8bc7fca
JH
98 if (spam_ok && Ustrcmp(prev_user_name, user_name) == 0)
99 return override ? OK : spam_rc;
8e669ac1 100
8523533c 101 /* make sure the eml mbox file is spooled up */
8544e77a 102 mbox_file = spool_mbox(&mbox_size, NULL);
8e669ac1 103
ddcf2b5f
JH
104 if (mbox_file == NULL)
105 {
8523533c
TK
106 /* error while spooling */
107 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 108 "%s error while creating mbox spool file", loglabel);
8523533c 109 return DEFER;
ddcf2b5f 110 }
8523533c 111
cfe75fc3 112 start = time(NULL);
b6e6e716 113
8523533c 114 /* socket does not start with '/' -> network socket */
ddcf2b5f
JH
115 if (*spamd_address_work != '/')
116 {
8523533c 117 int num_servers = 0;
29cfeb94 118 int current_server;
8523533c 119 uschar *address = NULL;
e1e7cfcb 120 uschar *spamd_address_list_ptr = spamd_address_work;
8523533c
TK
121 uschar address_buffer[256];
122 spamd_address_container * spamd_address_vector[32];
123
124 /* Check how many spamd servers we have
125 and register their addresses */
126 while ((address = string_nextinlist(&spamd_address_list_ptr, &sep,
127 address_buffer,
ddcf2b5f
JH
128 sizeof(address_buffer))) != NULL)
129 {
8e669ac1 130
29cfeb94 131 /* Potential memory leak as we never free the store. */
8523533c
TK
132 spamd_address_container *this_spamd =
133 (spamd_address_container *)store_get(sizeof(spamd_address_container));
8e669ac1 134
8523533c 135 /* grok spamd address and port */
d6e35dd0 136 if (sscanf(CS address, "%23s %u", this_spamd->tcp_addr, &this_spamd->tcp_port) != 2)
e252eb8c 137 {
8523533c 138 log_write(0, LOG_MAIN,
a56cc2b8 139 "%s warning - invalid spamd address: '%s'", loglabel, address);
8523533c 140 continue;
ddcf2b5f 141 }
8e669ac1 142
8523533c 143 spamd_address_vector[num_servers] = this_spamd;
a56cc2b8
JH
144 if ( ++num_servers
145 >= sizeof(spamd_address_vector)/sizeof(spamd_address_vector[0]))
8523533c 146 break;
ddcf2b5f 147 }
8e669ac1 148
8523533c 149 /* check if we have at least one server */
ddcf2b5f
JH
150 if (!num_servers)
151 {
8523533c 152 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8
JH
153 "%s no useable spamd server addresses in spamd_address configuration option.",
154 loglabel);
f1e894f3 155 (void)fclose(mbox_file);
8523533c 156 return DEFER;
ddcf2b5f 157 }
8523533c 158
a56cc2b8 159 while (num_servers > 0)
ddcf2b5f 160 {
2e64baa9 161 int i;
8523533c 162
29cfeb94 163 /* Randomly pick a server to try */
a56cc2b8 164 current_server = random_number(num_servers);
8e669ac1 165
8523533c
TK
166 debug_printf("trying server %s, port %u\n",
167 spamd_address_vector[current_server]->tcp_addr,
168 spamd_address_vector[current_server]->tcp_port);
8e669ac1 169
8523533c 170 /* contact a spamd */
a56cc2b8 171 if ((spamd_sock = ip_socket(SOCK_STREAM, AF_INET)) < 0)
ddcf2b5f 172 {
8523533c 173 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 174 "%s error creating IP socket for spamd", loglabel);
f1e894f3 175 (void)fclose(mbox_file);
8e669ac1 176 return DEFER;
ddcf2b5f 177 }
8e669ac1 178
a56cc2b8
JH
179 if (ip_connect(spamd_sock,
180 AF_INET,
181 spamd_address_vector[current_server]->tcp_addr,
182 spamd_address_vector[current_server]->tcp_port,
183 5 ) > -1)
8523533c
TK
184 /* connection OK */
185 break;
8e669ac1 186
8523533c 187 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8
JH
188 "%s warning - spamd connection to %s, port %u failed: %s",
189 loglabel,
8523533c
TK
190 spamd_address_vector[current_server]->tcp_addr,
191 spamd_address_vector[current_server]->tcp_port,
192 strerror(errno));
29cfeb94
PP
193
194 (void)close(spamd_sock);
195
196 /* Remove the server from the list. XXX We should free the memory */
197 num_servers--;
a56cc2b8 198 for (i = current_server; i < num_servers; i++)
29cfeb94 199 spamd_address_vector[i] = spamd_address_vector[i+1];
ddcf2b5f 200 }
29cfeb94 201
a56cc2b8 202 if (num_servers == 0)
ddcf2b5f 203 {
a56cc2b8 204 log_write(0, LOG_MAIN|LOG_PANIC, "%s all spamd servers failed", loglabel);
29cfeb94
PP
205 (void)fclose(mbox_file);
206 return DEFER;
ddcf2b5f 207 }
29cfeb94 208 }
ddcf2b5f
JH
209 else
210 {
8523533c
TK
211 /* open the local socket */
212
ddcf2b5f
JH
213 if ((spamd_sock = socket(AF_UNIX, SOCK_STREAM, 0)) < 0)
214 {
8523533c 215 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8
JH
216 "%s spamd: unable to acquire socket (%s)",
217 loglabel,
8523533c 218 strerror(errno));
f1e894f3 219 (void)fclose(mbox_file);
8523533c 220 return DEFER;
ddcf2b5f 221 }
8523533c
TK
222
223 server.sun_family = AF_UNIX;
b6e6e716 224 Ustrcpy(server.sun_path, spamd_address_work);
8523533c 225
ddcf2b5f
JH
226 if (connect(spamd_sock, (struct sockaddr *) &server, sizeof(struct sockaddr_un)) < 0)
227 {
8523533c 228 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8
JH
229 "%s spamd: unable to connect to UNIX socket %s (%s)",
230 loglabel,
b6e6e716 231 spamd_address_work, strerror(errno) );
f1e894f3
PH
232 (void)fclose(mbox_file);
233 (void)close(spamd_sock);
8523533c 234 return DEFER;
ddcf2b5f 235 }
8523533c
TK
236 }
237
ddcf2b5f
JH
238 if (spamd_sock == -1)
239 {
0f501486
PP
240 log_write(0, LOG_MAIN|LOG_PANIC,
241 "programming fault, spamd_sock unexpectedly unset");
242 (void)fclose(mbox_file);
243 (void)close(spamd_sock);
244 return DEFER;
ddcf2b5f 245 }
0f501486 246
8523533c 247 /* now we are connected to spamd on spamd_sock */
b07e6aa3 248 (void)string_format(spamd_buffer,
8523533c 249 sizeof(spamd_buffer),
f7b63901 250 "REPORT SPAMC/1.2\r\nUser: %s\r\nContent-length: %ld\r\n\r\n",
8523533c
TK
251 user_name,
252 mbox_size);
253
254 /* send our request */
ddcf2b5f
JH
255 if (send(spamd_sock, spamd_buffer, Ustrlen(spamd_buffer), 0) < 0)
256 {
f1e894f3 257 (void)close(spamd_sock);
8523533c 258 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 259 "%s spamd send failed: %s", loglabel, strerror(errno));
f1e894f3
PH
260 (void)fclose(mbox_file);
261 (void)close(spamd_sock);
8523533c 262 return DEFER;
ddcf2b5f 263 }
8523533c
TK
264
265 /* now send the file */
cfe75fc3
PH
266 /* spamd sometimes accepts conections but doesn't read data off
267 * the connection. We make the file descriptor non-blocking so
268 * that the write will only write sufficient data without blocking
269 * and we poll the desciptor to make sure that we can write without
270 * blocking. Short writes are gracefully handled and if the whole
271 * trasaction takes too long it is aborted.
25257489
PH
272 * Note: poll() is not supported in OSX 10.2 and is reported to be
273 * broken in more recent versions (up to 10.4).
cfe75fc3 274 */
f452e07e 275#ifndef NO_POLL_H
cfe75fc3
PH
276 pollfd.fd = spamd_sock;
277 pollfd.events = POLLOUT;
f452e07e 278#endif
ff790e47 279 (void)fcntl(spamd_sock, F_SETFL, O_NONBLOCK);
ddcf2b5f
JH
280 do
281 {
cfe75fc3 282 read = fread(spamd_buffer,1,sizeof(spamd_buffer),mbox_file);
ddcf2b5f
JH
283 if (read > 0)
284 {
cfe75fc3
PH
285 offset = 0;
286again:
f452e07e 287#ifndef NO_POLL_H
cfe75fc3 288 result = poll(&pollfd, 1, 1000);
25257489
PH
289
290/* Patch posted by Erik ? for OS X and applied by PH */
291#else
292 select_tv.tv_sec = 1;
293 select_tv.tv_usec = 0;
294 FD_ZERO(&select_fd);
295 FD_SET(spamd_sock, &select_fd);
296 result = select(spamd_sock+1, NULL, &select_fd, NULL, &select_tv);
297#endif
298/* End Erik's patch */
299
cfe75fc3 300 if (result == -1 && errno == EINTR)
25257489 301 goto again;
ddcf2b5f
JH
302 else if (result < 1)
303 {
cfe75fc3
PH
304 if (result == -1)
305 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 306 "%s %s on spamd socket", loglabel, strerror(errno));
ddcf2b5f
JH
307 else
308 {
cfe75fc3 309 if (time(NULL) - start < SPAMD_TIMEOUT)
c007c974 310 goto again;
cfe75fc3 311 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 312 "%s timed out writing spamd socket", loglabel);
ddcf2b5f 313 }
f1e894f3
PH
314 (void)close(spamd_sock);
315 (void)fclose(mbox_file);
8523533c 316 return DEFER;
ddcf2b5f 317 }
25257489 318
cfe75fc3 319 wrote = send(spamd_sock,spamd_buffer + offset,read - offset,0);
8d7d227d 320 if (wrote == -1)
ddcf2b5f
JH
321 {
322 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 323 "%s %s on spamd socket", loglabel, strerror(errno));
f1e894f3
PH
324 (void)close(spamd_sock);
325 (void)fclose(mbox_file);
8d7d227d 326 return DEFER;
ddcf2b5f
JH
327 }
328 if (offset + wrote != read)
329 {
cfe75fc3
PH
330 offset += wrote;
331 goto again;
ddcf2b5f 332 }
cfe75fc3
PH
333 }
334 }
cfe75fc3 335 while (!feof(mbox_file) && !ferror(mbox_file));
ddcf2b5f
JH
336
337 if (ferror(mbox_file))
338 {
cfe75fc3 339 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 340 "%s error reading spool file: %s", loglabel, strerror(errno));
f1e894f3
PH
341 (void)close(spamd_sock);
342 (void)fclose(mbox_file);
cfe75fc3 343 return DEFER;
ddcf2b5f 344 }
8523533c 345
f1e894f3 346 (void)fclose(mbox_file);
8523533c
TK
347
348 /* we're done sending, close socket for writing */
349 shutdown(spamd_sock,SHUT_WR);
8e669ac1 350
cfe75fc3
PH
351 /* read spamd response using what's left of the timeout.
352 */
8523533c
TK
353 memset(spamd_buffer, 0, sizeof(spamd_buffer));
354 offset = 0;
ddcf2b5f 355 while ((i = ip_recv(spamd_sock,
8523533c
TK
356 spamd_buffer + offset,
357 sizeof(spamd_buffer) - offset - 1,
ddcf2b5f 358 SPAMD_TIMEOUT - time(NULL) + start)) > 0 )
8523533c 359 offset += i;
8523533c
TK
360
361 /* error handling */
ddcf2b5f
JH
362 if (i <= 0 && errno != 0)
363 {
8523533c 364 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 365 "%s error reading from spamd socket: %s", loglabel, strerror(errno));
f1e894f3 366 (void)close(spamd_sock);
8523533c 367 return DEFER;
ddcf2b5f 368 }
8523533c
TK
369
370 /* reading done */
f1e894f3 371 (void)close(spamd_sock);
8523533c
TK
372
373 /* dig in the spamd output and put the report in a multiline header, if requested */
ddcf2b5f
JH
374 if (sscanf(CS spamd_buffer,
375 "SPAMD/%7s 0 EX_OK\r\nContent-length: %*u\r\n\r\n%lf/%lf\r\n%n",
376 spamd_version, &spamd_score, &spamd_threshold,
377 &spamd_report_offset) != 3)
378 {
8e669ac1 379
8523533c 380 /* try to fall back to pre-2.50 spamd output */
ddcf2b5f
JH
381 if (sscanf(CS spamd_buffer,
382 "SPAMD/%7s 0 EX_OK\r\nSpam: %*s ; %lf / %lf\r\n\r\n%n",
383 spamd_version, &spamd_score, &spamd_threshold,
384 &spamd_report_offset) != 3 )
385 {
8523533c 386 log_write(0, LOG_MAIN|LOG_PANIC,
a56cc2b8 387 "%s cannot parse spamd output", loglabel);
8523533c 388 return DEFER;
ddcf2b5f
JH
389 }
390 }
8523533c
TK
391
392 /* Create report. Since this is a multiline string,
393 we must hack it into shape first */
394 p = &spamd_buffer[spamd_report_offset];
395 q = spam_report_buffer;
ddcf2b5f
JH
396 while (*p != '\0')
397 {
8523533c 398 /* skip \r */
ddcf2b5f
JH
399 if (*p == '\r')
400 {
8523533c
TK
401 p++;
402 continue;
ddcf2b5f
JH
403 }
404 *q++ = *p;
405 if (*p++ == '\n')
406 {
89dec7b6
TF
407 /* add an extra space after the newline to ensure
408 that it is treated as a header continuation line */
ddcf2b5f
JH
409 *q++ = ' ';
410 }
411 }
8523533c 412 /* NULL-terminate */
ddcf2b5f 413 *q-- = '\0';
8523533c 414 /* cut off trailing leftovers */
ddcf2b5f
JH
415 while (*q <= ' ')
416 *q-- = '\0';
417
8523533c
TK
418 spam_report = spam_report_buffer;
419
420 /* create spam bar */
421 spamd_score_char = spamd_score > 0 ? '+' : '-';
422 j = abs((int)(spamd_score));
423 i = 0;
ddcf2b5f
JH
424 if (j != 0)
425 while ((i < j) && (i <= MAX_SPAM_BAR_CHARS))
8523533c 426 spam_bar_buffer[i++] = spamd_score_char;
ddcf2b5f
JH
427 else
428 {
8523533c
TK
429 spam_bar_buffer[0] = '/';
430 i = 1;
ddcf2b5f 431 }
8523533c
TK
432 spam_bar_buffer[i] = '\0';
433 spam_bar = spam_bar_buffer;
434
435 /* create "float" spam score */
b07e6aa3 436 (void)string_format(spam_score_buffer, sizeof(spam_score_buffer),"%.1f", spamd_score);
8523533c
TK
437 spam_score = spam_score_buffer;
438
439 /* create "int" spam score */
440 j = (int)((spamd_score + 0.001)*10);
b07e6aa3 441 (void)string_format(spam_score_int_buffer, sizeof(spam_score_int_buffer), "%d", j);
8523533c
TK
442 spam_score_int = spam_score_int_buffer;
443
444 /* compare threshold against score */
ddcf2b5f
JH
445 if (spamd_score >= spamd_threshold)
446 {
8523533c
TK
447 /* spam as determined by user's threshold */
448 spam_rc = OK;
ddcf2b5f
JH
449 }
450 else
451 {
8523533c
TK
452 /* not spam */
453 spam_rc = FAIL;
ddcf2b5f 454 }
8e669ac1 455
f7274286 456 /* remember expanded spamd_address if needed */
ddcf2b5f 457 if (spamd_address_work != spamd_address)
f7274286 458 prev_spamd_address_work = string_copy(spamd_address_work);
ddcf2b5f 459
f7274286
PP
460 /* remember user name and "been here" for it */
461 Ustrcpy(prev_user_name, user_name);
462 spam_ok = 1;
8e669ac1 463
ddcf2b5f 464 if (override) /* always return OK, no matter what the score */
8523533c 465 return OK;
ddcf2b5f 466 else
8523533c 467 return spam_rc;
8523533c
TK
468}
469
470#endif