Start
[exim.git] / src / src / transports / tf_maildir.c
CommitLineData
0756eb3c
PH
1/* $Cambridge: exim/src/src/transports/tf_maildir.c,v 1.1 2004/10/07 13:10:02 ph10 Exp $ */
2
3/*************************************************
4* Exim - an Internet mail transport agent *
5*************************************************/
6
7/* Copyright (c) University of Cambridge 1995 - 2004 */
8/* See the file NOTICE for conditions of use and distribution. */
9
10/* Functions in support of the use of maildirsize files for handling quotas in
11maildir directories. Some of the rules are a bit baroque:
12
13http://www.inter7.com/courierimap/README.maildirquota.html
14
15We try to follow most of that, except that the directories to skip for quota
16calculations are not hard wired in, but are supplied as a regex. */
17
18
19#include "../exim.h"
20#include "appendfile.h"
21#include "tf_maildir.h"
22
23#define MAX_FILE_SIZE 5120
24
25
26
27/*************************************************
28* Ensure maildir directories exist *
29*************************************************/
30
31/* This function is called at the start of a maildir delivery, to ensure that
32all the relevant directories exist.
33
34Argument:
35 path the base directory name
36 addr the address item (for setting an error message)
37 create_directory true if we are allowed to create missing directories
38 dirmode the mode for created directories
39
40Returns: TRUE on success; FALSE on failure
41*/
42
43BOOL maildir_ensure_directories(uschar *path, address_item *addr,
44 BOOL create_directory, int dirmode)
45{
46int i;
47struct stat statbuf;
48char *subdirs[] = { "/tmp", "/new", "/cur" };
49
50DEBUG(D_transport)
51 debug_printf("ensuring maildir directories exist in %s\n", path);
52
53/* First ensure that the path we have is a directory; if it does not exist,
54create it. Then make sure the tmp, new & cur subdirs of the maildir are
55there. If not, fail which aborts the delivery (even though the cur subdir is
56not actually needed for delivery). Handle all 4 directory tests/creates in a
57loop so that code can be shared. */
58
59for (i = 0; i < 4; i++)
60 {
61 int j;
62 uschar *dir, *mdir;
63
64 if (i == 0)
65 {
66 mdir = US"";
67 dir = path;
68 }
69 else
70 {
71 mdir = US subdirs[i-1];
72 dir = mdir + 1;
73 }
74
75 /* Check an existing path is a directory. This is inside a loop because
76 there is a potential race condition when creating the directory - some
77 other process may get there first. Give up after trying several times,
78 though. */
79
80 for (j = 0; j < 10; j++)
81 {
82 if (Ustat(dir, &statbuf) == 0)
83 {
84 if (S_ISDIR(statbuf.st_mode)) break; /* out of the race loop */
85 addr->message = string_sprintf("%s%s is not a directory", path,
86 mdir);
87 addr->basic_errno = ERRNO_NOTDIRECTORY;
88 return FALSE;
89 }
90
91 /* Try to make if non-existent and configured to do so */
92
93 if (errno == ENOENT && create_directory)
94 {
95 if (!directory_make(NULL, dir, dirmode, FALSE))
96 {
97 if (errno == EEXIST) continue; /* repeat the race loop */
98 addr->message = string_sprintf("cannot create %s%s", path, mdir);
99 addr->basic_errno = errno;
100 return FALSE;
101 }
102 DEBUG(D_transport)
103 debug_printf("created directory %s%s\n", path, mdir);
104 break; /* out of the race loop */
105 }
106
107 /* stat() error other than ENOENT, or ENOENT and not creatable */
108
109 addr->message = string_sprintf("stat() error for %s%s: %s", path, mdir,
110 strerror(errno));
111 addr->basic_errno = errno;
112 return FALSE;
113 }
114
115 /* If we went round the loop 10 times, the directory was flickering in
116 and out of existence like someone in a malfunctioning Star Trek
117 transporter. */
118
119 if (j >= 10)
120 {
121 addr->message = string_sprintf("existence of %s%s unclear\n", path,
122 mdir);
123 addr->basic_errno = errno;
124 addr->special_action = SPECIAL_FREEZE;
125 return FALSE;
126 }
127
128 /* First time through the directories loop, cd to the main directory */
129
130 if (i == 0 && Uchdir(path) != 0)
131 {
132 addr->message = string_sprintf ("cannot chdir to %s", path);
133 addr->basic_errno = errno;
134 return FALSE;
135 }
136 }
137
138return TRUE; /* All directories exist */
139}
140
141
142
143
144/*************************************************
145* Update maildirsizefile for new file *
146*************************************************/
147
148/* This function is called to add a new line to the file, recording the length
149of the newly added message. There isn't much we can do on failure...
150
151Arguments:
152 fd the open file descriptor
153 size the size of the message
154
155Returns: nothing
156*/
157
158void
159maildir_record_length(int fd, int size)
160{
161int len;
162uschar buffer[256];
163sprintf(CS buffer, "%d 1\n", size);
164len = Ustrlen(buffer);
165(void)lseek(fd, 0, SEEK_END);
166(void)write(fd, buffer, len);
167DEBUG(D_transport)
168 debug_printf("added '%.*s' to maildirsize file\n", len-1, buffer);
169}
170
171
172
173/*************************************************
174* Find the size of a maildir *
175*************************************************/
176
177/* This function is called when we have to recalculate the size of a maildir by
178scanning all the files and directories therein. There are rules and conventions
179about which files or directories are included. We support this by the use of a
180regex to match directories that are to be included.
181
182Maildirs can only be one level deep. However, this function recurses, so it
183might cope with deeper nestings. We use the existing check_dir_size() function
184to add up the sizes of the files in a directory that contains messages.
185
186The function returns the most recent timestamp encountered. It can also be run
187in a dummy mode in which it does not scan for sizes, but just returns the
188timestamp.
189
190Arguments:
191 path the path to the maildir
192 filecount where to store the count of messages
193 latest where to store the latest timestamp encountered
194 regex a regex for getting files sizes from file names
195 dir_regex a regex for matching directories to be included
196 timestamp_only don't actually compute any sizes
197
198Returns: the sum of the sizes of the messages
199*/
200
201int
202maildir_compute_size(uschar *path, int *filecount, time_t *latest,
203 const pcre *regex, const pcre *dir_regex, BOOL timestamp_only)
204{
205DIR *dir;
206int sum = 0;
207struct dirent *ent;
208struct stat statbuf;
209
210dir = opendir(CS path);
211if (dir == NULL) return 0;
212
213while ((ent = readdir(dir)) != NULL)
214 {
215 uschar *name = US ent->d_name;
216 uschar buffer[1024];
217
218 if (Ustrcmp(name, ".") == 0 || Ustrcmp(name, "..") == 0) continue;
219
220 /* We are normally supplied with a regex for choosing which directories to
221 scan. We do the regex match first, because that avoids a stat() for names
222 we aren't interested in. */
223
224 if (dir_regex != NULL &&
225 pcre_exec(dir_regex, NULL, CS name, Ustrlen(name), 0, 0, NULL, 0) < 0)
226 {
227 DEBUG(D_transport)
228 debug_printf("skipping %s/%s: dir_regex does not match\n", path, name);
229 continue;
230 }
231
232 /* The name is OK; stat it. */
233
234 if (!string_format(buffer, sizeof(buffer), "%s/%s", path, name))
235 {
236 DEBUG(D_transport)
237 debug_printf("maildir_compute_size: name too long: dir=%s name=%s\n",
238 path, name);
239 continue;
240 }
241
242 if (Ustat(buffer, &statbuf) < 0)
243 {
244 DEBUG(D_transport)
245 debug_printf("maildir_compute_size: stat error %d for %s: %s\n", errno,
246 buffer, strerror(errno));
247 continue;
248 }
249
250 if ((statbuf.st_mode & S_IFMT) != S_IFDIR)
251 {
252 DEBUG(D_transport)
253 debug_printf("skipping %s/%s: not a directory\n", path, name);
254 continue;
255 }
256
257 /* Keep the latest timestamp encountered */
258
259 if (statbuf.st_mtime > *latest) *latest = statbuf.st_mtime;
260
261 /* If this is a maildir folder, call this function recursively. */
262
263 if (name[0] == '.')
264 {
265 sum += maildir_compute_size(buffer, filecount, latest, regex, dir_regex,
266 timestamp_only);
267 }
268
269 /* Otherwise it must be a folder that contains messages (e.g. new or cur), so
270 we need to get its size, unless all we are interested in is the timestamp. */
271
272 else if (!timestamp_only)
273 {
274 sum += check_dir_size(buffer, filecount, regex);
275 }
276 }
277
278closedir(dir);
279DEBUG(D_transport)
280 {
281 if (timestamp_only)
282 debug_printf("maildir_compute_size (timestamp_only): %ld\n",
283 (long int) *latest);
284 else
285 debug_printf("maildir_compute_size: path=%s\n sum=%d filecount=%d "
286 "timestamp=%ld\n", path, sum, *filecount, (long int) *latest);
287 }
288return sum;
289}
290
291
292
293/*************************************************
294* Create or update maildirsizefile *
295*************************************************/
296
297/* This function is called before a delivery if the option to use
298maildirsizefile is enabled. Its function is to create the file if it does not
299exist, or to update it if that is necessary.
300
301The logic in this function follows the rules that are described in
302
303 http://www.inter7.com/courierimap/README.maildirquota.html
304
305Or, at least, it is supposed to!
306
307Arguments:
308 path the path to the maildir directory; this is already backed-up
309 to the parent if the delivery diretory is a maildirfolder
310 ob the appendfile options block
311 regex a compiled regex for getting a file's size from its name
312 dir_regex a compiled regex for selecting maildir directories
313 returned_size where to return the current size of the maildir, even if
314 the maildirsizefile is removed because of a race
315
316Returns: >=0 a file descriptor for an open maildirsize file
317 -1 there was an error opening or accessing the file
318 -2 the file was removed because of a race
319*/
320
321int
322maildir_ensure_sizefile(uschar *path, appendfile_transport_options_block *ob,
323 const pcre *regex, const pcre *dir_regex, int *returned_size,
324 int *returned_filecount)
325{
326int count, fd;
327int cached_quota = 0;
328int cached_quota_filecount = 0;
329int size = 0;
330int filecount = 0;
331int linecount = 0;
332uschar *filename;
333uschar buffer[MAX_FILE_SIZE];
334uschar *ptr = buffer;
335uschar *endptr;
336
337/* Try a few times to open or create the file, in case another process is doing
338the same thing. */
339
340filename = string_sprintf("%s/maildirsize", path);
341
342DEBUG(D_transport) debug_printf("looking for maildirsize in %s\n", path);
343fd = Uopen(filename, O_RDWR|O_APPEND, 0);
344if (fd < 0)
345 {
346 if (errno != ENOENT) return -1;
347 DEBUG(D_transport)
348 debug_printf("%s does not exist: recalculating\n", filename);
349 goto RECALCULATE;
350 }
351
352/* The file has been successfully opened. Check that the cached quota value is
353still correct, and that the size of the file is still small enough. If so,
354compute the maildir size from the file. */
355
356count = read(fd, buffer, sizeof(buffer));
357if (count >= sizeof(buffer))
358 {
359 DEBUG(D_transport)
360 debug_printf("maildirsize file too big (%d): recalculating\n", count);
361 goto RECALCULATE;
362 }
363buffer[count] = 0; /* Ensure string terminated */
364
365/* Read the quota parameters from the first line of the data. */
366
367DEBUG(D_transport)
368 debug_printf("reading quota parameters from maildirsize data\n");
369
370for (;;)
371 {
372 long int n = Ustrtol(ptr, &endptr, 10);
373
374 /* Only two data items are currently defined; ignore any others that
375 may be present. The spec is for a number followed by a letter. Anything
376 else we reject and recalculate. */
377
378 if (*endptr == 'S') cached_quota = n;
379 else if (*endptr == 'C') cached_quota_filecount = n;
380 if (!isalpha(*endptr++))
381 {
382 DEBUG(D_transport)
383 debug_printf("quota parameter number not followed by letter in "
384 "\"%.*s\": recalculating maildirsize\n", (int)(endptr - buffer),
385 buffer);
386 goto RECALCULATE;
387 }
388 if (*endptr == '\n' || *endptr == 0) break;
389 if (*endptr++ != ',')
390 {
391 DEBUG(D_transport)
392 debug_printf("quota parameter not followed by comma in "
393 "\"%.*s\": recalculating maildirsize\n", (int)(endptr - buffer),
394 buffer);
395 goto RECALCULATE;
396 }
397 ptr = endptr;
398 }
399
400/* Check the cached values against the current settings */
401
402if (cached_quota != ob->quota_value ||
403 cached_quota_filecount != ob->quota_filecount_value)
404 {
405 DEBUG(D_transport)
406 debug_printf("cached quota is out of date: recalculating\n"
407 " quota=%d cached_quota=%d filecount_quota=%d "
408 "cached_quota_filecount=%d\n", ob->quota_value, cached_quota,
409 ob->quota_filecount_value, cached_quota_filecount);
410 goto RECALCULATE;
411 }
412
413/* Quota values agree; parse the rest of the data to get the sizes. At this
414stage, *endptr points either to 0 or to '\n'. */
415
416DEBUG(D_transport)
417 debug_printf("computing maildir size from maildirsize data\n");
418
419while (*endptr++ == '\n')
420 {
421 if (*endptr == 0) break;
422 linecount++;
423 ptr = endptr;
424 size += Ustrtol(ptr, &endptr, 10);
425 if (*endptr != ' ') break;
426 ptr = endptr + 1;
427 filecount += Ustrtol(ptr, &endptr, 10);
428 }
429
430/* If *endptr is zero, we have successfully parsed the file, and we now have
431the size of the mailbox as cached in the file. The "rules" say that if this
432value indicates that the mailbox is over quota, we must recalculate if there is
433more than one entry in the file, or if the file is older than 15 minutes. */
434
435if (*endptr == 0)
436 {
437 if (ob->quota_value > 0 &&
438 (size + (ob->quota_is_inclusive? message_size : 0) > ob->quota_value ||
439 (ob->quota_filecount_value > 0 &&
440 filecount + (ob->quota_is_inclusive ? 1:0) >
441 ob->quota_filecount_value)
442 ))
443 {
444 struct stat statbuf;
445 if (linecount > 1)
446 {
447 DEBUG(D_transport) debug_printf("over quota and maildirsizefile has "
448 "more than 1 entry: recalculating\n");
449 goto RECALCULATE;
450 }
451
452 if (fstat(fd, &statbuf) < 0) goto RECALCULATE; /* Should never occur */
453
454 if (time(NULL) - statbuf.st_mtime > 15*60)
455 {
456 DEBUG(D_transport) debug_printf("over quota and maildirsize is older "
457 "than 15 minutes: recalculating\n");
458 goto RECALCULATE;
459 }
460 }
461 }
462
463
464/* If *endptr is not zero, there was a syntax error in the file. */
465
466else
467 {
468 int len;
469 time_t old_latest, new_latest;
470 uschar *tempname;
471 struct timeval tv;
472
473 DEBUG(D_transport)
474 {
475 uschar *p = endptr;
476 while (p > buffer && p[-1] != '\n') p--;
477 endptr[1] = 0;
478
479 debug_printf("error in maildirsizefile: unexpected character %d in "
480 "line %d (starting '%s'): recalculating\n",
481 *endptr, linecount + 1, string_printing(p));
482 }
483
484 /* Either there is no file, or the quota value has changed, or the file has
485 got too big, or there was some format error in the file. Recalculate the size
486 and write new contents to a temporary file; then rename it. After any
487 error, just return -1 as the file descriptor. */
488
489 RECALCULATE:
490
491 if (fd >= 0) close(fd);
492 old_latest = 0;
493 filecount = 0;
494 size = maildir_compute_size(path, &filecount, &old_latest, regex, dir_regex,
495 FALSE);
496
497 (void)gettimeofday(&tv, NULL);
498 tempname = string_sprintf("%s/tmp/%lu.H%luP%lu.%s", path, tv.tv_sec,
499 tv.tv_usec, getpid(), primary_hostname);
500
501 fd = Uopen(tempname, O_RDWR|O_CREAT|O_EXCL, 0600);
502 if (fd >= 0)
503 {
504 (void)sprintf(CS buffer, "%dS,%dC\n%d %d\n", ob->quota_value,
505 ob->quota_filecount_value, size, filecount);
506 len = Ustrlen(buffer);
507 if (write(fd, buffer, len) != len || Urename(tempname, filename) < 0)
508 {
509 close(fd);
510 fd = -1;
511 }
512 }
513
514 /* If any of the directories have been modified since the last timestamp we
515 saw, we have to junk this maildirsize file. */
516
517 DEBUG(D_transport) debug_printf("checking subdirectory timestamps\n");
518 new_latest = 0;
519 (void)maildir_compute_size(path, NULL, &new_latest , NULL, dir_regex, TRUE);
520 if (new_latest > old_latest)
521 {
522 DEBUG(D_transport) debug_printf("abandoning maildirsize because of "
523 "a later subdirectory modification\n");
524 (void)Uunlink(filename);
525 close(fd);
526 fd = -1;
527 }
528 }
529
530/* Return the sizes and the file descriptor, if any */
531
532DEBUG(D_transport) debug_printf("returning maildir size=%d filecount=%d\n",
533 size, filecount);
534*returned_size = size;
535*returned_filecount = filecount;
536return fd;
537}
538
539/* End of tf_maildir.c */