Reformat to project standard
[exim.git] / src / src / spam.c
CommitLineData
8523533c
TK
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
5/* Copyright (c) Tom Kistner <tom@duncanthrax.net> 2003-???? */
6/* License: GPL */
7
8/* Code for calling spamassassin's spamd. Called from acl.c. */
9
10#include "exim.h"
11#ifdef WITH_CONTENT_SCAN
12#include "spam.h"
13
14uschar spam_score_buffer[16];
15uschar spam_score_int_buffer[16];
16uschar spam_bar_buffer[128];
17uschar spam_report_buffer[32600];
18uschar prev_user_name[128] = "";
19int spam_ok = 0;
20int spam_rc = 0;
f7274286 21uschar *prev_spamd_address_work = NULL;
8523533c 22
c007c974
JH
23int
24spam(uschar **listptr)
25{
8523533c
TK
26 int sep = 0;
27 uschar *list = *listptr;
28 uschar *user_name;
29 uschar user_name_buffer[128];
f7b63901 30 unsigned long mbox_size;
8523533c 31 FILE *mbox_file;
0f501486 32 int spamd_sock = -1;
8523533c 33 uschar spamd_buffer[32600];
cfe75fc3 34 int i, j, offset, result;
8523533c
TK
35 uschar spamd_version[8];
36 uschar spamd_score_char;
37 double spamd_threshold, spamd_score;
38 int spamd_report_offset;
39 uschar *p,*q;
40 int override = 0;
cfe75fc3
PH
41 time_t start;
42 size_t read, wrote;
8523533c 43 struct sockaddr_un server;
f452e07e 44#ifndef NO_POLL_H
cfe75fc3 45 struct pollfd pollfd;
25257489
PH
46#else /* Patch posted by Erik ? for OS X */
47 struct timeval select_tv; /* and applied by PH */
48 fd_set select_fd;
f452e07e 49#endif
b6e6e716 50 uschar *spamd_address_work;
8523533c 51
5614ee86 52 /* stop compiler warning */
91ecef39 53 result = 0;
5614ee86 54
8523533c
TK
55 /* find the username from the option list */
56 if ((user_name = string_nextinlist(&list, &sep,
57 user_name_buffer,
ddcf2b5f
JH
58 sizeof(user_name_buffer))) == NULL)
59 {
8523533c
TK
60 /* no username given, this means no scanning should be done */
61 return FAIL;
ddcf2b5f 62 }
8523533c
TK
63
64 /* if username is "0" or "false", do not scan */
65 if ( (Ustrcmp(user_name,"0") == 0) ||
ddcf2b5f 66 (strcmpic(user_name,US"false") == 0) )
8523533c 67 return FAIL;
8523533c
TK
68
69 /* if there is an additional option, check if it is "true" */
ddcf2b5f 70 if (strcmpic(list,US"true") == 0)
8523533c
TK
71 /* in that case, always return true later */
72 override = 1;
8523533c 73
f7274286 74 /* expand spamd_address if needed */
ddcf2b5f
JH
75 if (*spamd_address == '$')
76 {
f7274286 77 spamd_address_work = expand_string(spamd_address);
ddcf2b5f
JH
78 if (spamd_address_work == NULL)
79 {
f7274286
PP
80 log_write(0, LOG_MAIN|LOG_PANIC,
81 "spamassassin acl condition: spamd_address starts with $, but expansion failed: %s", expand_string_message);
82 return DEFER;
ddcf2b5f 83 }
f7274286 84 }
f7274286
PP
85 else
86 spamd_address_work = spamd_address;
87
88 /* check if previous spamd_address was expanded and has changed. dump cached results if so */
ddcf2b5f
JH
89 if ( spam_ok
90 && prev_spamd_address_work != NULL
91 && Ustrcmp(prev_spamd_address_work, spamd_address_work) != 0
92 )
f7274286 93 spam_ok = 0;
f7274286 94
8e669ac1 95 /* if we scanned for this username last time, just return */
ddcf2b5f 96 if ( spam_ok && Ustrcmp(prev_user_name, user_name) == 0)
8523533c
TK
97 if (override)
98 return OK;
99 else
100 return spam_rc;
8e669ac1 101
8523533c 102 /* make sure the eml mbox file is spooled up */
8544e77a 103 mbox_file = spool_mbox(&mbox_size, NULL);
8e669ac1 104
ddcf2b5f
JH
105 if (mbox_file == NULL)
106 {
8523533c
TK
107 /* error while spooling */
108 log_write(0, LOG_MAIN|LOG_PANIC,
109 "spam acl condition: error while creating mbox spool file");
110 return DEFER;
ddcf2b5f 111 }
8523533c 112
cfe75fc3 113 start = time(NULL);
b6e6e716 114
8523533c 115 /* socket does not start with '/' -> network socket */
ddcf2b5f
JH
116 if (*spamd_address_work != '/')
117 {
8523533c 118 int num_servers = 0;
29cfeb94 119 int current_server;
8523533c 120 uschar *address = NULL;
e1e7cfcb 121 uschar *spamd_address_list_ptr = spamd_address_work;
8523533c
TK
122 uschar address_buffer[256];
123 spamd_address_container * spamd_address_vector[32];
124
125 /* Check how many spamd servers we have
126 and register their addresses */
127 while ((address = string_nextinlist(&spamd_address_list_ptr, &sep,
128 address_buffer,
ddcf2b5f
JH
129 sizeof(address_buffer))) != NULL)
130 {
8e669ac1 131
29cfeb94 132 /* Potential memory leak as we never free the store. */
8523533c
TK
133 spamd_address_container *this_spamd =
134 (spamd_address_container *)store_get(sizeof(spamd_address_container));
8e669ac1 135
8523533c 136 /* grok spamd address and port */
e252eb8c
JH
137 if (sscanf(CS address, "%23s %u", this_spamd->tcp_addr, &(this_spamd->tcp_port)) != 2)
138 {
8523533c
TK
139 log_write(0, LOG_MAIN,
140 "spam acl condition: warning - invalid spamd address: '%s'", address);
141 continue;
ddcf2b5f 142 }
8e669ac1 143
8523533c 144 spamd_address_vector[num_servers] = this_spamd;
ddcf2b5f 145 if (++num_servers > 31)
8523533c 146 break;
ddcf2b5f 147 }
8e669ac1 148
8523533c 149 /* check if we have at least one server */
ddcf2b5f
JH
150 if (!num_servers)
151 {
8523533c
TK
152 log_write(0, LOG_MAIN|LOG_PANIC,
153 "spam acl condition: no useable spamd server addresses in spamd_address configuration option.");
f1e894f3 154 (void)fclose(mbox_file);
8523533c 155 return DEFER;
ddcf2b5f 156 }
8523533c 157
ddcf2b5f
JH
158 while ( num_servers > 0 )
159 {
2e64baa9 160 int i;
8523533c 161
29cfeb94
PP
162 /* Randomly pick a server to try */
163 current_server = random_number( num_servers );
8e669ac1 164
8523533c
TK
165 debug_printf("trying server %s, port %u\n",
166 spamd_address_vector[current_server]->tcp_addr,
167 spamd_address_vector[current_server]->tcp_port);
8e669ac1 168
8523533c 169 /* contact a spamd */
ddcf2b5f
JH
170 if ( (spamd_sock = ip_socket(SOCK_STREAM, AF_INET)) < 0)
171 {
8523533c
TK
172 log_write(0, LOG_MAIN|LOG_PANIC,
173 "spam acl condition: error creating IP socket for spamd");
f1e894f3 174 (void)fclose(mbox_file);
8e669ac1 175 return DEFER;
ddcf2b5f 176 }
8e669ac1 177
8523533c
TK
178 if (ip_connect( spamd_sock,
179 AF_INET,
180 spamd_address_vector[current_server]->tcp_addr,
181 spamd_address_vector[current_server]->tcp_port,
ddcf2b5f 182 5 ) > -1)
8523533c
TK
183 /* connection OK */
184 break;
8e669ac1 185
8523533c
TK
186 log_write(0, LOG_MAIN|LOG_PANIC,
187 "spam acl condition: warning - spamd connection to %s, port %u failed: %s",
188 spamd_address_vector[current_server]->tcp_addr,
189 spamd_address_vector[current_server]->tcp_port,
190 strerror(errno));
29cfeb94
PP
191
192 (void)close(spamd_sock);
193
194 /* Remove the server from the list. XXX We should free the memory */
195 num_servers--;
ddcf2b5f 196 for ( i = current_server; i < num_servers; i++ )
29cfeb94 197 spamd_address_vector[i] = spamd_address_vector[i+1];
ddcf2b5f 198 }
29cfeb94 199
ddcf2b5f
JH
200 if ( num_servers == 0 )
201 {
29cfeb94
PP
202 log_write(0, LOG_MAIN|LOG_PANIC, "spam acl condition: all spamd servers failed");
203 (void)fclose(mbox_file);
204 return DEFER;
ddcf2b5f 205 }
29cfeb94 206 }
ddcf2b5f
JH
207 else
208 {
8523533c
TK
209 /* open the local socket */
210
ddcf2b5f
JH
211 if ((spamd_sock = socket(AF_UNIX, SOCK_STREAM, 0)) < 0)
212 {
8523533c
TK
213 log_write(0, LOG_MAIN|LOG_PANIC,
214 "malware acl condition: spamd: unable to acquire socket (%s)",
215 strerror(errno));
f1e894f3 216 (void)fclose(mbox_file);
8523533c 217 return DEFER;
ddcf2b5f 218 }
8523533c
TK
219
220 server.sun_family = AF_UNIX;
b6e6e716 221 Ustrcpy(server.sun_path, spamd_address_work);
8523533c 222
ddcf2b5f
JH
223 if (connect(spamd_sock, (struct sockaddr *) &server, sizeof(struct sockaddr_un)) < 0)
224 {
8523533c
TK
225 log_write(0, LOG_MAIN|LOG_PANIC,
226 "malware acl condition: spamd: unable to connect to UNIX socket %s (%s)",
b6e6e716 227 spamd_address_work, strerror(errno) );
f1e894f3
PH
228 (void)fclose(mbox_file);
229 (void)close(spamd_sock);
8523533c 230 return DEFER;
ddcf2b5f 231 }
8523533c
TK
232 }
233
ddcf2b5f
JH
234 if (spamd_sock == -1)
235 {
0f501486
PP
236 log_write(0, LOG_MAIN|LOG_PANIC,
237 "programming fault, spamd_sock unexpectedly unset");
238 (void)fclose(mbox_file);
239 (void)close(spamd_sock);
240 return DEFER;
ddcf2b5f 241 }
0f501486 242
8523533c 243 /* now we are connected to spamd on spamd_sock */
b07e6aa3 244 (void)string_format(spamd_buffer,
8523533c 245 sizeof(spamd_buffer),
f7b63901 246 "REPORT SPAMC/1.2\r\nUser: %s\r\nContent-length: %ld\r\n\r\n",
8523533c
TK
247 user_name,
248 mbox_size);
249
250 /* send our request */
ddcf2b5f
JH
251 if (send(spamd_sock, spamd_buffer, Ustrlen(spamd_buffer), 0) < 0)
252 {
f1e894f3 253 (void)close(spamd_sock);
8523533c
TK
254 log_write(0, LOG_MAIN|LOG_PANIC,
255 "spam acl condition: spamd send failed: %s", strerror(errno));
f1e894f3
PH
256 (void)fclose(mbox_file);
257 (void)close(spamd_sock);
8523533c 258 return DEFER;
ddcf2b5f 259 }
8523533c
TK
260
261 /* now send the file */
cfe75fc3
PH
262 /* spamd sometimes accepts conections but doesn't read data off
263 * the connection. We make the file descriptor non-blocking so
264 * that the write will only write sufficient data without blocking
265 * and we poll the desciptor to make sure that we can write without
266 * blocking. Short writes are gracefully handled and if the whole
267 * trasaction takes too long it is aborted.
25257489
PH
268 * Note: poll() is not supported in OSX 10.2 and is reported to be
269 * broken in more recent versions (up to 10.4).
cfe75fc3 270 */
f452e07e 271#ifndef NO_POLL_H
cfe75fc3
PH
272 pollfd.fd = spamd_sock;
273 pollfd.events = POLLOUT;
f452e07e 274#endif
ff790e47 275 (void)fcntl(spamd_sock, F_SETFL, O_NONBLOCK);
ddcf2b5f
JH
276 do
277 {
cfe75fc3 278 read = fread(spamd_buffer,1,sizeof(spamd_buffer),mbox_file);
ddcf2b5f
JH
279 if (read > 0)
280 {
cfe75fc3
PH
281 offset = 0;
282again:
f452e07e 283#ifndef NO_POLL_H
cfe75fc3 284 result = poll(&pollfd, 1, 1000);
25257489
PH
285
286/* Patch posted by Erik ? for OS X and applied by PH */
287#else
288 select_tv.tv_sec = 1;
289 select_tv.tv_usec = 0;
290 FD_ZERO(&select_fd);
291 FD_SET(spamd_sock, &select_fd);
292 result = select(spamd_sock+1, NULL, &select_fd, NULL, &select_tv);
293#endif
294/* End Erik's patch */
295
cfe75fc3 296 if (result == -1 && errno == EINTR)
25257489 297 goto again;
ddcf2b5f
JH
298 else if (result < 1)
299 {
cfe75fc3
PH
300 if (result == -1)
301 log_write(0, LOG_MAIN|LOG_PANIC,
302 "spam acl condition: %s on spamd socket", strerror(errno));
ddcf2b5f
JH
303 else
304 {
cfe75fc3 305 if (time(NULL) - start < SPAMD_TIMEOUT)
c007c974 306 goto again;
cfe75fc3
PH
307 log_write(0, LOG_MAIN|LOG_PANIC,
308 "spam acl condition: timed out writing spamd socket");
ddcf2b5f 309 }
f1e894f3
PH
310 (void)close(spamd_sock);
311 (void)fclose(mbox_file);
8523533c 312 return DEFER;
ddcf2b5f 313 }
25257489 314
cfe75fc3 315 wrote = send(spamd_sock,spamd_buffer + offset,read - offset,0);
8d7d227d 316 if (wrote == -1)
ddcf2b5f
JH
317 {
318 log_write(0, LOG_MAIN|LOG_PANIC,
8d7d227d 319 "spam acl condition: %s on spamd socket", strerror(errno));
f1e894f3
PH
320 (void)close(spamd_sock);
321 (void)fclose(mbox_file);
8d7d227d 322 return DEFER;
ddcf2b5f
JH
323 }
324 if (offset + wrote != read)
325 {
cfe75fc3
PH
326 offset += wrote;
327 goto again;
ddcf2b5f 328 }
cfe75fc3
PH
329 }
330 }
cfe75fc3 331 while (!feof(mbox_file) && !ferror(mbox_file));
ddcf2b5f
JH
332
333 if (ferror(mbox_file))
334 {
cfe75fc3
PH
335 log_write(0, LOG_MAIN|LOG_PANIC,
336 "spam acl condition: error reading spool file: %s", strerror(errno));
f1e894f3
PH
337 (void)close(spamd_sock);
338 (void)fclose(mbox_file);
cfe75fc3 339 return DEFER;
ddcf2b5f 340 }
8523533c 341
f1e894f3 342 (void)fclose(mbox_file);
8523533c
TK
343
344 /* we're done sending, close socket for writing */
345 shutdown(spamd_sock,SHUT_WR);
8e669ac1 346
cfe75fc3
PH
347 /* read spamd response using what's left of the timeout.
348 */
8523533c
TK
349 memset(spamd_buffer, 0, sizeof(spamd_buffer));
350 offset = 0;
ddcf2b5f 351 while ((i = ip_recv(spamd_sock,
8523533c
TK
352 spamd_buffer + offset,
353 sizeof(spamd_buffer) - offset - 1,
ddcf2b5f 354 SPAMD_TIMEOUT - time(NULL) + start)) > 0 )
8523533c 355 offset += i;
8523533c
TK
356
357 /* error handling */
ddcf2b5f
JH
358 if (i <= 0 && errno != 0)
359 {
8523533c
TK
360 log_write(0, LOG_MAIN|LOG_PANIC,
361 "spam acl condition: error reading from spamd socket: %s", strerror(errno));
f1e894f3 362 (void)close(spamd_sock);
8523533c 363 return DEFER;
ddcf2b5f 364 }
8523533c
TK
365
366 /* reading done */
f1e894f3 367 (void)close(spamd_sock);
8523533c
TK
368
369 /* dig in the spamd output and put the report in a multiline header, if requested */
ddcf2b5f
JH
370 if (sscanf(CS spamd_buffer,
371 "SPAMD/%7s 0 EX_OK\r\nContent-length: %*u\r\n\r\n%lf/%lf\r\n%n",
372 spamd_version, &spamd_score, &spamd_threshold,
373 &spamd_report_offset) != 3)
374 {
8e669ac1 375
8523533c 376 /* try to fall back to pre-2.50 spamd output */
ddcf2b5f
JH
377 if (sscanf(CS spamd_buffer,
378 "SPAMD/%7s 0 EX_OK\r\nSpam: %*s ; %lf / %lf\r\n\r\n%n",
379 spamd_version, &spamd_score, &spamd_threshold,
380 &spamd_report_offset) != 3 )
381 {
8523533c
TK
382 log_write(0, LOG_MAIN|LOG_PANIC,
383 "spam acl condition: cannot parse spamd output");
384 return DEFER;
ddcf2b5f
JH
385 }
386 }
8523533c
TK
387
388 /* Create report. Since this is a multiline string,
389 we must hack it into shape first */
390 p = &spamd_buffer[spamd_report_offset];
391 q = spam_report_buffer;
ddcf2b5f
JH
392 while (*p != '\0')
393 {
8523533c 394 /* skip \r */
ddcf2b5f
JH
395 if (*p == '\r')
396 {
8523533c
TK
397 p++;
398 continue;
ddcf2b5f
JH
399 }
400 *q++ = *p;
401 if (*p++ == '\n')
402 {
89dec7b6
TF
403 /* add an extra space after the newline to ensure
404 that it is treated as a header continuation line */
ddcf2b5f
JH
405 *q++ = ' ';
406 }
407 }
8523533c 408 /* NULL-terminate */
ddcf2b5f 409 *q-- = '\0';
8523533c 410 /* cut off trailing leftovers */
ddcf2b5f
JH
411 while (*q <= ' ')
412 *q-- = '\0';
413
8523533c
TK
414 spam_report = spam_report_buffer;
415
416 /* create spam bar */
417 spamd_score_char = spamd_score > 0 ? '+' : '-';
418 j = abs((int)(spamd_score));
419 i = 0;
ddcf2b5f
JH
420 if (j != 0)
421 while ((i < j) && (i <= MAX_SPAM_BAR_CHARS))
8523533c 422 spam_bar_buffer[i++] = spamd_score_char;
ddcf2b5f
JH
423 else
424 {
8523533c
TK
425 spam_bar_buffer[0] = '/';
426 i = 1;
ddcf2b5f 427 }
8523533c
TK
428 spam_bar_buffer[i] = '\0';
429 spam_bar = spam_bar_buffer;
430
431 /* create "float" spam score */
b07e6aa3 432 (void)string_format(spam_score_buffer, sizeof(spam_score_buffer),"%.1f", spamd_score);
8523533c
TK
433 spam_score = spam_score_buffer;
434
435 /* create "int" spam score */
436 j = (int)((spamd_score + 0.001)*10);
b07e6aa3 437 (void)string_format(spam_score_int_buffer, sizeof(spam_score_int_buffer), "%d", j);
8523533c
TK
438 spam_score_int = spam_score_int_buffer;
439
440 /* compare threshold against score */
ddcf2b5f
JH
441 if (spamd_score >= spamd_threshold)
442 {
8523533c
TK
443 /* spam as determined by user's threshold */
444 spam_rc = OK;
ddcf2b5f
JH
445 }
446 else
447 {
8523533c
TK
448 /* not spam */
449 spam_rc = FAIL;
ddcf2b5f 450 }
8e669ac1 451
f7274286 452 /* remember expanded spamd_address if needed */
ddcf2b5f 453 if (spamd_address_work != spamd_address)
f7274286 454 prev_spamd_address_work = string_copy(spamd_address_work);
ddcf2b5f 455
f7274286
PP
456 /* remember user name and "been here" for it */
457 Ustrcpy(prev_user_name, user_name);
458 spam_ok = 1;
8e669ac1 459
ddcf2b5f 460 if (override) /* always return OK, no matter what the score */
8523533c 461 return OK;
ddcf2b5f 462 else
8523533c 463 return spam_rc;
8523533c
TK
464}
465
466#endif