Testsuite: output changes resulting
[exim.git] / src / src / string.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
f9ba5e22 5/* Copyright (c) University of Cambridge 1995 - 2018 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Miscellaneous string-handling functions. Some are not required for
9utilities and tests, and are cut out by the COMPILE_UTILITY macro. */
10
11
12#include "exim.h"
d12746bc 13#include <assert.h>
059ec3d9
PH
14
15
16#ifndef COMPILE_UTILITY
17/*************************************************
18* Test for IP address *
19*************************************************/
20
21/* This used just to be a regular expression, but with IPv6 things are a bit
22more complicated. If the address contains a colon, it is assumed to be a v6
23address (assuming HAVE_IPV6 is set). If a mask is permitted and one is present,
24and maskptr is not NULL, its offset is placed there.
25
26Arguments:
27 s a string
28 maskptr NULL if no mask is permitted to follow
29 otherwise, points to an int where the offset of '/' is placed
1688f43b 30 if there is no / followed by trailing digits, *maskptr is set 0
059ec3d9
PH
31
32Returns: 0 if the string is not a textual representation of an IP address
33 4 if it is an IPv4 address
34 6 if it is an IPv6 address
35*/
36
37int
b1f8e4f8 38string_is_ip_address(const uschar *s, int *maskptr)
059ec3d9 39{
059ec3d9
PH
40int yield = 4;
41
42/* If an optional mask is permitted, check for it. If found, pass back the
43offset. */
44
8d909960 45if (maskptr)
059ec3d9 46 {
b1f8e4f8 47 const uschar *ss = s + Ustrlen(s);
059ec3d9
PH
48 *maskptr = 0;
49 if (s != ss && isdigit(*(--ss)))
50 {
51 while (ss > s && isdigit(ss[-1])) ss--;
52 if (ss > s && *(--ss) == '/') *maskptr = ss - s;
53 }
54 }
55
56/* A colon anywhere in the string => IPv6 address */
57
58if (Ustrchr(s, ':') != NULL)
59 {
60 BOOL had_double_colon = FALSE;
61 BOOL v4end = FALSE;
059ec3d9
PH
62
63 yield = 6;
64
65 /* An IPv6 address must start with hex digit or double colon. A single
66 colon is invalid. */
67
68 if (*s == ':' && *(++s) != ':') return 0;
69
70 /* Now read up to 8 components consisting of up to 4 hex digits each. There
71 may be one and only one appearance of double colon, which implies any number
72 of binary zero bits. The number of preceding components is held in count. */
73
d7978c0f 74 for (int count = 0; count < 8; count++)
059ec3d9
PH
75 {
76 /* If the end of the string is reached before reading 8 components, the
77 address is valid provided a double colon has been read. This also applies
78 if we hit the / that introduces a mask or the % that introduces the
79 interface specifier (scope id) of a link-local address. */
80
8d909960 81 if (*s == 0 || *s == '%' || *s == '/') return had_double_colon ? yield : 0;
059ec3d9
PH
82
83 /* If a component starts with an additional colon, we have hit a double
84 colon. This is permitted to appear once only, and counts as at least
85 one component. The final component may be of this form. */
86
87 if (*s == ':')
88 {
89 if (had_double_colon) return 0;
90 had_double_colon = TRUE;
91 s++;
92 continue;
93 }
94
95 /* If the remainder of the string contains a dot but no colons, we
96 can expect a trailing IPv4 address. This is valid if either there has
97 been no double-colon and this is the 7th component (with the IPv4 address
98 being the 7th & 8th components), OR if there has been a double-colon
99 and fewer than 6 components. */
100
101 if (Ustrchr(s, ':') == NULL && Ustrchr(s, '.') != NULL)
102 {
103 if ((!had_double_colon && count != 6) ||
104 (had_double_colon && count > 6)) return 0;
105 v4end = TRUE;
106 yield = 6;
107 break;
108 }
109
110 /* Check for at least one and not more than 4 hex digits for this
111 component. */
112
113 if (!isxdigit(*s++)) return 0;
114 if (isxdigit(*s) && isxdigit(*(++s)) && isxdigit(*(++s))) s++;
115
116 /* If the component is terminated by colon and there is more to
117 follow, skip over the colon. If there is no more to follow the address is
118 invalid. */
119
120 if (*s == ':' && *(++s) == 0) return 0;
121 }
122
123 /* If about to handle a trailing IPv4 address, drop through. Otherwise
124 all is well if we are at the end of the string or at the mask or at a percent
125 sign, which introduces the interface specifier (scope id) of a link local
126 address. */
127
1688f43b
PH
128 if (!v4end)
129 return (*s == 0 || *s == '%' ||
130 (*s == '/' && maskptr != NULL && *maskptr != 0))? yield : 0;
059ec3d9
PH
131 }
132
133/* Test for IPv4 address, which may be the tail-end of an IPv6 address. */
134
d7978c0f 135for (int i = 0; i < 4; i++)
059ec3d9 136 {
8d909960
JH
137 long n;
138 uschar * end;
139
059ec3d9 140 if (i != 0 && *s++ != '.') return 0;
8d909960
JH
141 n = strtol(CCS s, CSS &end, 10);
142 if (n > 255 || n < 0 || end <= s || end > s+3) return 0;
143 s = end;
059ec3d9
PH
144 }
145
8d909960 146return !*s || (*s == '/' && maskptr && *maskptr != 0) ? yield : 0;
059ec3d9
PH
147}
148#endif /* COMPILE_UTILITY */
149
150
151/*************************************************
152* Format message size *
153*************************************************/
154
155/* Convert a message size in bytes to printing form, rounding
156according to the magnitude of the number. A value of zero causes
157a string of spaces to be returned.
158
159Arguments:
160 size the message size in bytes
161 buffer where to put the answer
162
163Returns: pointer to the buffer
164 a string of exactly 5 characters is normally returned
165*/
166
167uschar *
168string_format_size(int size, uschar *buffer)
169{
f3ebb786 170if (size == 0) Ustrcpy(buffer, US" ");
059ec3d9
PH
171else if (size < 1024) sprintf(CS buffer, "%5d", size);
172else if (size < 10*1024)
173 sprintf(CS buffer, "%4.1fK", (double)size / 1024.0);
174else if (size < 1024*1024)
175 sprintf(CS buffer, "%4dK", (size + 512)/1024);
176else if (size < 10*1024*1024)
177 sprintf(CS buffer, "%4.1fM", (double)size / (1024.0 * 1024.0));
178else
179 sprintf(CS buffer, "%4dM", (size + 512 * 1024)/(1024*1024));
180return buffer;
181}
182
183
184
185#ifndef COMPILE_UTILITY
186/*************************************************
187* Convert a number to base 62 format *
188*************************************************/
189
190/* Convert a long integer into an ASCII base 62 string. For Cygwin the value of
191BASE_62 is actually 36. Always return exactly 6 characters plus zero, in a
192static area.
193
194Argument: a long integer
195Returns: pointer to base 62 string
196*/
197
198uschar *
199string_base62(unsigned long int value)
200{
201static uschar yield[7];
202uschar *p = yield + sizeof(yield) - 1;
203*p = 0;
204while (p > yield)
205 {
206 *(--p) = base62_chars[value % BASE_62];
207 value /= BASE_62;
208 }
209return yield;
210}
211#endif /* COMPILE_UTILITY */
212
213
214
059ec3d9
PH
215/*************************************************
216* Interpret escape sequence *
217*************************************************/
218
219/* This function is called from several places where escape sequences are to be
220interpreted in strings.
221
222Arguments:
223 pp points a pointer to the initiating "\" in the string;
224 the pointer gets updated to point to the final character
c3aefacc
HSHR
225 If the backslash is the last character in the string, it
226 is not interpreted.
059ec3d9
PH
227Returns: the value of the character escape
228*/
229
230int
55414b25 231string_interpret_escape(const uschar **pp)
059ec3d9 232{
3fb3c68d
JH
233#ifdef COMPILE_UTILITY
234const uschar *hex_digits= CUS"0123456789abcdef";
235#endif
059ec3d9 236int ch;
55414b25 237const uschar *p = *pp;
059ec3d9 238ch = *(++p);
c3aefacc 239if (ch == '\0') return **pp;
059ec3d9
PH
240if (isdigit(ch) && ch != '8' && ch != '9')
241 {
242 ch -= '0';
243 if (isdigit(p[1]) && p[1] != '8' && p[1] != '9')
244 {
245 ch = ch * 8 + *(++p) - '0';
246 if (isdigit(p[1]) && p[1] != '8' && p[1] != '9')
247 ch = ch * 8 + *(++p) - '0';
248 }
249 }
250else switch(ch)
251 {
c7396ac5
PP
252 case 'b': ch = '\b'; break;
253 case 'f': ch = '\f'; break;
059ec3d9
PH
254 case 'n': ch = '\n'; break;
255 case 'r': ch = '\r'; break;
256 case 't': ch = '\t'; break;
c7396ac5 257 case 'v': ch = '\v'; break;
059ec3d9
PH
258 case 'x':
259 ch = 0;
260 if (isxdigit(p[1]))
261 {
262 ch = ch * 16 +
263 Ustrchr(hex_digits, tolower(*(++p))) - hex_digits;
264 if (isxdigit(p[1])) ch = ch * 16 +
265 Ustrchr(hex_digits, tolower(*(++p))) - hex_digits;
266 }
267 break;
268 }
269*pp = p;
270return ch;
271}
059ec3d9
PH
272
273
274
275#ifndef COMPILE_UTILITY
276/*************************************************
277* Ensure string is printable *
278*************************************************/
279
280/* This function is called for critical strings. It checks for any
281non-printing characters, and if any are found, it makes a new copy
282of the string with suitable escape sequences. It is most often called by the
283macro string_printing(), which sets allow_tab TRUE.
284
285Arguments:
286 s the input string
287 allow_tab TRUE to allow tab as a printing character
288
289Returns: string with non-printers encoded as printing sequences
290*/
291
55414b25
JH
292const uschar *
293string_printing2(const uschar *s, BOOL allow_tab)
059ec3d9
PH
294{
295int nonprintcount = 0;
296int length = 0;
55414b25 297const uschar *t = s;
059ec3d9
PH
298uschar *ss, *tt;
299
300while (*t != 0)
301 {
302 int c = *t++;
303 if (!mac_isprint(c) || (!allow_tab && c == '\t')) nonprintcount++;
304 length++;
305 }
306
307if (nonprintcount == 0) return s;
308
309/* Get a new block of store guaranteed big enough to hold the
310expanded string. */
311
f3ebb786 312ss = store_get(length + nonprintcount * 3 + 1, is_tainted(s));
059ec3d9 313
4c04137d 314/* Copy everything, escaping non printers. */
059ec3d9
PH
315
316t = s;
317tt = ss;
318
319while (*t != 0)
320 {
321 int c = *t;
322 if (mac_isprint(c) && (allow_tab || c != '\t')) *tt++ = *t++; else
323 {
324 *tt++ = '\\';
325 switch (*t)
326 {
327 case '\n': *tt++ = 'n'; break;
328 case '\r': *tt++ = 'r'; break;
329 case '\b': *tt++ = 'b'; break;
330 case '\v': *tt++ = 'v'; break;
331 case '\f': *tt++ = 'f'; break;
332 case '\t': *tt++ = 't'; break;
333 default: sprintf(CS tt, "%03o", *t); tt += 3; break;
334 }
335 t++;
336 }
337 }
338*tt = 0;
c7396ac5
PP
339return ss;
340}
79fe97d8
PP
341#endif /* COMPILE_UTILITY */
342
c7396ac5
PP
343/*************************************************
344* Undo printing escapes in string *
345*************************************************/
346
347/* This function is the reverse of string_printing2. It searches for
348backslash characters and if any are found, it makes a new copy of the
349string with escape sequences parsed. Otherwise it returns the original
350string.
351
352Arguments:
353 s the input string
354
355Returns: string with printing escapes parsed back
356*/
357
358uschar *
359string_unprinting(uschar *s)
360{
361uschar *p, *q, *r, *ss;
362int len, off;
363
364p = Ustrchr(s, '\\');
365if (!p) return s;
366
367len = Ustrlen(s) + 1;
f3ebb786 368ss = store_get(len, is_tainted(s));
c7396ac5
PP
369
370q = ss;
371off = p - s;
372if (off)
373 {
374 memcpy(q, s, off);
375 q += off;
376 }
377
378while (*p)
379 {
380 if (*p == '\\')
381 {
55414b25 382 *q++ = string_interpret_escape((const uschar **)&p);
823ad74f 383 p++;
c7396ac5
PP
384 }
385 else
386 {
387 r = Ustrchr(p, '\\');
388 if (!r)
389 {
390 off = Ustrlen(p);
391 memcpy(q, p, off);
392 p += off;
393 q += off;
394 break;
395 }
396 else
397 {
398 off = r - p;
399 memcpy(q, p, off);
400 q += off;
401 p = r;
402 }
403 }
404 }
405*q = '\0';
406
059ec3d9
PH
407return ss;
408}
059ec3d9
PH
409
410
411
412
bf13aee1
JH
413#if (defined(HAVE_LOCAL_SCAN) || defined(EXPAND_DLFUNC)) \
414 && !defined(MACRO_PREDEF) && !defined(COMPILE_UTILITY)
059ec3d9
PH
415/*************************************************
416* Copy and save string *
417*************************************************/
418
f3ebb786 419/*
059ec3d9 420Argument: string to copy
f3ebb786 421Returns: copy of string in new store with the same taint status
059ec3d9
PH
422*/
423
424uschar *
e59797e3 425string_copy_function(const uschar *s)
059ec3d9 426{
f3ebb786
JH
427return string_copy_taint(s, is_tainted(s));
428}
429
430/* This function assumes that memcpy() is faster than strcpy().
431As above, but explicitly specifying the result taint status
432*/
433
434uschar *
d48326c0 435string_copy_taint_function(const uschar * s, BOOL tainted)
f3ebb786 436{
059ec3d9 437int len = Ustrlen(s) + 1;
f3ebb786 438uschar *ss = store_get(len, tainted);
059ec3d9
PH
439memcpy(ss, s, len);
440return ss;
441}
442
443
f3ebb786 444
059ec3d9
PH
445/*************************************************
446* Copy and save string, given length *
447*************************************************/
448
449/* It is assumed the data contains no zeros. A zero is added
450onto the end.
451
452Arguments:
453 s string to copy
454 n number of characters
455
456Returns: copy of string in new store
457*/
458
459uschar *
e59797e3 460string_copyn_function(const uschar *s, int n)
059ec3d9 461{
f3ebb786 462uschar *ss = store_get(n + 1, is_tainted(s));
059ec3d9
PH
463Ustrncpy(ss, s, n);
464ss[n] = 0;
465return ss;
466}
e59797e3 467#endif
059ec3d9
PH
468
469
470/*************************************************
e59797e3 471* Copy and save string in malloc'd store *
059ec3d9
PH
472*************************************************/
473
e59797e3 474/* This function assumes that memcpy() is faster than strcpy().
059ec3d9 475
e59797e3
JH
476Argument: string to copy
477Returns: copy of string in new store
059ec3d9
PH
478*/
479
480uschar *
e59797e3 481string_copy_malloc(const uschar *s)
059ec3d9 482{
e59797e3
JH
483int len = Ustrlen(s) + 1;
484uschar *ss = store_malloc(len);
485memcpy(ss, s, len);
059ec3d9
PH
486return ss;
487}
488
489
490
e28326d8
PH
491/*************************************************
492* Copy string if long, inserting newlines *
493*************************************************/
494
495/* If the given string is longer than 75 characters, it is copied, and within
496the copy, certain space characters are converted into newlines.
497
498Argument: pointer to the string
499Returns: pointer to the possibly altered string
500*/
501
502uschar *
503string_split_message(uschar *msg)
504{
505uschar *s, *ss;
506
507if (msg == NULL || Ustrlen(msg) <= 75) return msg;
508s = ss = msg = string_copy(msg);
509
510for (;;)
511 {
512 int i = 0;
513 while (i < 75 && *ss != 0 && *ss != '\n') ss++, i++;
514 if (*ss == 0) break;
515 if (*ss == '\n')
516 s = ++ss;
517 else
518 {
519 uschar *t = ss + 1;
520 uschar *tt = NULL;
521 while (--t > s + 35)
522 {
523 if (*t == ' ')
524 {
525 if (t[-1] == ':') { tt = t; break; }
526 if (tt == NULL) tt = t;
527 }
528 }
529
530 if (tt == NULL) /* Can't split behind - try ahead */
531 {
532 t = ss + 1;
533 while (*t != 0)
534 {
535 if (*t == ' ' || *t == '\n')
536 { tt = t; break; }
537 t++;
538 }
539 }
540
541 if (tt == NULL) break; /* Can't find anywhere to split */
542 *tt = '\n';
543 s = ss = tt+1;
544 }
545 }
546
547return msg;
548}
549
550
551
059ec3d9
PH
552/*************************************************
553* Copy returned DNS domain name, de-escaping *
554*************************************************/
555
556/* If a domain name contains top-bit characters, some resolvers return
557the fully qualified name with those characters turned into escapes. The
558convention is a backslash followed by _decimal_ digits. We convert these
559back into the original binary values. This will be relevant when
560allow_utf8_domains is set true and UTF-8 characters are used in domain
561names. Backslash can also be used to escape other characters, though we
562shouldn't come across them in domain names.
563
564Argument: the domain name string
565Returns: copy of string in new store, de-escaped
566*/
567
568uschar *
569string_copy_dnsdomain(uschar *s)
570{
571uschar *yield;
f3ebb786 572uschar *ss = yield = store_get(Ustrlen(s) + 1, is_tainted(s));
059ec3d9
PH
573
574while (*s != 0)
575 {
576 if (*s != '\\')
059ec3d9 577 *ss++ = *s++;
059ec3d9
PH
578 else if (isdigit(s[1]))
579 {
580 *ss++ = (s[1] - '0')*100 + (s[2] - '0')*10 + s[3] - '0';
581 s += 4;
582 }
583 else if (*(++s) != 0)
059ec3d9 584 *ss++ = *s++;
059ec3d9
PH
585 }
586
587*ss = 0;
588return yield;
589}
590
591
592#ifndef COMPILE_UTILITY
593/*************************************************
594* Copy space-terminated or quoted string *
595*************************************************/
596
597/* This function copies from a string until its end, or until whitespace is
598encountered, unless the string begins with a double quote, in which case the
599terminating quote is sought, and escaping within the string is done. The length
600of a de-quoted string can be no longer than the original, since escaping always
601turns n characters into 1 character.
602
603Argument: pointer to the pointer to the first character, which gets updated
604Returns: the new string
605*/
606
607uschar *
55414b25 608string_dequote(const uschar **sptr)
059ec3d9 609{
55414b25 610const uschar *s = *sptr;
059ec3d9
PH
611uschar *t, *yield;
612
613/* First find the end of the string */
614
615if (*s != '\"')
059ec3d9 616 while (*s != 0 && !isspace(*s)) s++;
059ec3d9
PH
617else
618 {
619 s++;
8c513105 620 while (*s && *s != '\"')
059ec3d9
PH
621 {
622 if (*s == '\\') (void)string_interpret_escape(&s);
623 s++;
624 }
8c513105 625 if (*s) s++;
059ec3d9
PH
626 }
627
628/* Get enough store to copy into */
629
f3ebb786 630t = yield = store_get(s - *sptr + 1, is_tainted(*sptr));
059ec3d9
PH
631s = *sptr;
632
633/* Do the copy */
634
635if (*s != '\"')
059ec3d9 636 while (*s != 0 && !isspace(*s)) *t++ = *s++;
059ec3d9
PH
637else
638 {
639 s++;
640 while (*s != 0 && *s != '\"')
641 {
f3ebb786 642 *t++ = *s == '\\' ? string_interpret_escape(&s) : *s;
059ec3d9
PH
643 s++;
644 }
f3ebb786 645 if (*s) s++;
059ec3d9
PH
646 }
647
648/* Update the pointer and return the terminated copy */
649
650*sptr = s;
651*t = 0;
652return yield;
653}
654#endif /* COMPILE_UTILITY */
655
656
657
658/*************************************************
659* Format a string and save it *
660*************************************************/
661
94759fce 662/* The formatting is done by string_vformat, which checks the length of
13e70f55 663everything. Taint is taken from the worst of the arguments.
059ec3d9
PH
664
665Arguments:
666 format a printf() format - deliberately char * rather than uschar *
667 because it will most usually be a literal string
668 ... arguments for format
669
670Returns: pointer to fresh piece of store containing sprintf'ed string
671*/
672
673uschar *
f3ebb786 674string_sprintf_trc(const char *format, const uschar * func, unsigned line, ...)
059ec3d9 675{
8aa16eb7
JH
676#ifdef COMPILE_UTILITY
677uschar buffer[STRING_SPRINTF_BUFFER_SIZE];
678gstring gs = { .size = STRING_SPRINTF_BUFFER_SIZE, .ptr = 0, .s = buffer };
679gstring * g = &gs;
680unsigned flags = 0;
681#else
682gstring * g = NULL;
683unsigned flags = SVFMT_REBUFFER|SVFMT_EXTEND;
684#endif
d12746bc 685
8aa16eb7 686va_list ap;
f3ebb786 687va_start(ap, line);
8aa16eb7
JH
688g = string_vformat_trc(g, func, line, STRING_SPRINTF_BUFFER_SIZE,
689 flags, format, ap);
059ec3d9 690va_end(ap);
d12746bc 691
f3ebb786 692if (!g)
d12746bc
JH
693 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
694 "string_sprintf expansion was longer than %d; format string was (%s)\n"
f3ebb786
JH
695 " called from %s %d\n",
696 STRING_SPRINTF_BUFFER_SIZE, format, func, line);
d12746bc 697
8aa16eb7
JH
698#ifdef COMPILE_UTILITY
699return string_copyn(g->s, g->ptr);
700#else
f3ebb786
JH
701gstring_release_unused(g);
702return string_from_gstring(g);
8aa16eb7 703#endif
059ec3d9
PH
704}
705
706
707
708/*************************************************
709* Case-independent strncmp() function *
710*************************************************/
711
712/*
713Arguments:
714 s first string
715 t second string
716 n number of characters to compare
717
718Returns: < 0, = 0, or > 0, according to the comparison
719*/
720
721int
1ba28e2b 722strncmpic(const uschar *s, const uschar *t, int n)
059ec3d9
PH
723{
724while (n--)
725 {
726 int c = tolower(*s++) - tolower(*t++);
727 if (c) return c;
728 }
729return 0;
730}
731
732
733/*************************************************
734* Case-independent strcmp() function *
735*************************************************/
736
737/*
738Arguments:
739 s first string
740 t second string
741
742Returns: < 0, = 0, or > 0, according to the comparison
743*/
744
745int
1ba28e2b 746strcmpic(const uschar *s, const uschar *t)
059ec3d9
PH
747{
748while (*s != 0)
749 {
750 int c = tolower(*s++) - tolower(*t++);
751 if (c != 0) return c;
752 }
753return *t;
754}
755
756
757/*************************************************
758* Case-independent strstr() function *
759*************************************************/
760
761/* The third argument specifies whether whitespace is required
762to follow the matched string.
763
764Arguments:
765 s string to search
766 t substring to search for
767 space_follows if TRUE, match only if whitespace follows
768
769Returns: pointer to substring in string, or NULL if not found
770*/
771
772uschar *
773strstric(uschar *s, uschar *t, BOOL space_follows)
774{
775uschar *p = t;
776uschar *yield = NULL;
777int cl = tolower(*p);
778int cu = toupper(*p);
779
780while (*s)
781 {
782 if (*s == cl || *s == cu)
783 {
784 if (yield == NULL) yield = s;
785 if (*(++p) == 0)
786 {
787 if (!space_follows || s[1] == ' ' || s[1] == '\n' ) return yield;
788 yield = NULL;
789 p = t;
790 }
791 cl = tolower(*p);
792 cu = toupper(*p);
793 s++;
794 }
795 else if (yield != NULL)
796 {
797 yield = NULL;
798 p = t;
799 cl = tolower(*p);
800 cu = toupper(*p);
801 }
802 else s++;
803 }
804return NULL;
805}
806
807
808
d12746bc
JH
809#ifdef COMPILE_UTILITY
810/* Dummy version for this function; it should never be called */
811static void
f3ebb786 812gstring_grow(gstring * g, int count)
d12746bc
JH
813{
814assert(FALSE);
815}
816#endif
817
818
819
059ec3d9
PH
820#ifndef COMPILE_UTILITY
821/*************************************************
822* Get next string from separated list *
823*************************************************/
824
825/* Leading and trailing space is removed from each item. The separator in the
826list is controlled by the int pointed to by the separator argument as follows:
827
ec95d1a6
PH
828 If the value is > 0 it is used as the separator. This is typically used for
829 sublists such as slash-separated options. The value is always a printing
830 character.
831
832 (If the value is actually > UCHAR_MAX there is only one item in the list.
059ec3d9
PH
833 This is used for some cases when called via functions that sometimes
834 plough through lists, and sometimes are given single items.)
059ec3d9 835
ec95d1a6
PH
836 If the value is <= 0, the string is inspected for a leading <x, where x is an
837 ispunct() or an iscntrl() character. If found, x is used as the separator. If
838 not found:
839
840 (a) if separator == 0, ':' is used
841 (b) if separator <0, -separator is used
842
843 In all cases the value of the separator that is used is written back to the
844 int so that it is used on subsequent calls as we progress through the list.
845
846A literal ispunct() separator can be represented in an item by doubling, but
847there is no way to include an iscntrl() separator as part of the data.
059ec3d9
PH
848
849Arguments:
850 listptr points to a pointer to the current start of the list; the
851 pointer gets updated to point after the end of the next item
852 separator a pointer to the separator character in an int (see above)
853 buffer where to put a copy of the next string in the list; or
854 NULL if the next string is returned in new memory
855 buflen when buffer is not NULL, the size of buffer; otherwise ignored
856
857Returns: pointer to buffer, containing the next substring,
858 or NULL if no more substrings
859*/
860
861uschar *
ba74fb8d
JH
862string_nextinlist_trc(const uschar **listptr, int *separator, uschar *buffer, int buflen,
863 const uschar * func, int line)
059ec3d9 864{
55414b25
JH
865int sep = *separator;
866const uschar *s = *listptr;
ec95d1a6 867BOOL sep_is_special;
059ec3d9 868
8b455685 869if (!s) return NULL;
ec95d1a6
PH
870
871/* This allows for a fixed specified separator to be an iscntrl() character,
872but at the time of implementation, this is never the case. However, it's best
873to be conservative. */
874
875while (isspace(*s) && *s != sep) s++;
876
877/* A change of separator is permitted, so look for a leading '<' followed by an
878allowed character. */
059ec3d9
PH
879
880if (sep <= 0)
881 {
ec95d1a6 882 if (*s == '<' && (ispunct(s[1]) || iscntrl(s[1])))
059ec3d9
PH
883 {
884 sep = s[1];
b72f857f 885 if (*++s) ++s;
ec95d1a6 886 while (isspace(*s) && *s != sep) s++;
059ec3d9
PH
887 }
888 else
8b455685 889 sep = sep ? -sep : ':';
059ec3d9
PH
890 *separator = sep;
891 }
892
ec95d1a6
PH
893/* An empty string has no list elements */
894
8b455685 895if (!*s) return NULL;
059ec3d9 896
ec95d1a6
PH
897/* Note whether whether or not the separator is an iscntrl() character. */
898
899sep_is_special = iscntrl(sep);
900
059ec3d9
PH
901/* Handle the case when a buffer is provided. */
902
617d3932 903if (buffer)
059ec3d9 904 {
d4ff61d1 905 int p = 0;
ba74fb8d
JH
906 if (is_tainted(s) && !is_tainted(buffer))
907 die_tainted(US"string_nextinlist", func, line);
8b455685 908 for (; *s; s++)
059ec3d9 909 {
ec95d1a6 910 if (*s == sep && (*(++s) != sep || sep_is_special)) break;
059ec3d9
PH
911 if (p < buflen - 1) buffer[p++] = *s;
912 }
913 while (p > 0 && isspace(buffer[p-1])) p--;
8b455685 914 buffer[p] = '\0';
059ec3d9
PH
915 }
916
917/* Handle the case when a buffer is not provided. */
918
919else
920 {
acec9514 921 gstring * g = NULL;
ec95d1a6 922
059ec3d9 923 /* We know that *s != 0 at this point. However, it might be pointing to a
ec95d1a6
PH
924 separator, which could indicate an empty string, or (if an ispunct()
925 character) could be doubled to indicate a separator character as data at the
926 start of a string. Avoid getting working memory for an empty item. */
059ec3d9
PH
927
928 if (*s == sep)
929 {
930 s++;
ec95d1a6
PH
931 if (*s != sep || sep_is_special)
932 {
933 *listptr = s;
934 return string_copy(US"");
935 }
059ec3d9
PH
936 }
937
ec95d1a6
PH
938 /* Not an empty string; the first character is guaranteed to be a data
939 character. */
940
941 for (;;)
059ec3d9 942 {
d7978c0f
JH
943 const uschar * ss;
944 for (ss = s + 1; *ss && *ss != sep; ) ss++;
acec9514 945 g = string_catn(g, s, ss-s);
ec95d1a6 946 s = ss;
8b455685 947 if (!*s || *++s != sep || sep_is_special) break;
059ec3d9 948 }
acec9514
JH
949 while (g->ptr > 0 && isspace(g->s[g->ptr-1])) g->ptr--;
950 buffer = string_from_gstring(g);
e59797e3 951 gstring_release_unused(g);
059ec3d9
PH
952 }
953
954/* Update the current pointer and return the new string */
955
956*listptr = s;
957return buffer;
958}
059ec3d9
PH
959
960
4226691b
JH
961static const uschar *
962Ustrnchr(const uschar * s, int c, unsigned * len)
963{
964unsigned siz = *len;
965while (siz)
966 {
967 if (!*s) return NULL;
968 if (*s == c)
969 {
970 *len = siz;
971 return s;
972 }
973 s++;
974 siz--;
975 }
976return NULL;
977}
978
979
76146973 980/************************************************
1d9ddac9 981* Add element to separated list *
76146973 982************************************************/
4226691b
JH
983/* This function is used to build a list, returning an allocated null-terminated
984growable string. The given element has any embedded separator characters
76146973
JH
985doubled.
986
4226691b
JH
987Despite having the same growable-string interface as string_cat() the list is
988always returned null-terminated.
989
76146973 990Arguments:
acec9514 991 list expanding-string for the list that is being built, or NULL
76146973 992 if this is a new list that has no contents yet
4c04137d
JS
993 sep list separator character
994 ele new element to be appended to the list
76146973
JH
995
996Returns: pointer to the start of the list, changed if copied for expansion.
997*/
998
acec9514
JH
999gstring *
1000string_append_listele(gstring * list, uschar sep, const uschar * ele)
76146973 1001{
76146973
JH
1002uschar * sp;
1003
acec9514
JH
1004if (list && list->ptr)
1005 list = string_catn(list, &sep, 1);
76146973 1006
e3dd1d67 1007while((sp = Ustrchr(ele, sep)))
76146973 1008 {
acec9514
JH
1009 list = string_catn(list, ele, sp-ele+1);
1010 list = string_catn(list, &sep, 1);
76146973
JH
1011 ele = sp+1;
1012 }
acec9514
JH
1013list = string_cat(list, ele);
1014(void) string_from_gstring(list);
4226691b 1015return list;
76146973 1016}
00ba27c5
JH
1017
1018
acec9514
JH
1019gstring *
1020string_append_listele_n(gstring * list, uschar sep, const uschar * ele,
1021 unsigned len)
00ba27c5 1022{
00ba27c5
JH
1023const uschar * sp;
1024
acec9514
JH
1025if (list && list->ptr)
1026 list = string_catn(list, &sep, 1);
00ba27c5
JH
1027
1028while((sp = Ustrnchr(ele, sep, &len)))
1029 {
acec9514
JH
1030 list = string_catn(list, ele, sp-ele+1);
1031 list = string_catn(list, &sep, 1);
00ba27c5
JH
1032 ele = sp+1;
1033 len--;
1034 }
acec9514
JH
1035list = string_catn(list, ele, len);
1036(void) string_from_gstring(list);
4226691b 1037return list;
00ba27c5 1038}
76146973
JH
1039
1040
059ec3d9 1041
bce15b62
JH
1042/* A slightly-bogus listmaker utility; the separator is a string so
1043can be multiple chars - there is no checking for the element content
1044containing any of the separator. */
1045
1046gstring *
1047string_append2_listele_n(gstring * list, const uschar * sepstr,
1048 const uschar * ele, unsigned len)
1049{
bce15b62
JH
1050if (list && list->ptr)
1051 list = string_cat(list, sepstr);
1052
1053list = string_catn(list, ele, len);
1054(void) string_from_gstring(list);
1055return list;
1056}
1057
1058
1059
acec9514 1060/************************************************/
f3ebb786
JH
1061/* Add more space to a growable-string. The caller should check
1062first if growth is required. The gstring struct is modified on
1063return; specifically, the string-base-pointer may have been changed.
d12746bc
JH
1064
1065Arguments:
1066 g the growable-string
f3ebb786 1067 count amount needed for g->ptr to increase by
938593e9
JH
1068*/
1069
1070static void
f3ebb786 1071gstring_grow(gstring * g, int count)
acec9514 1072{
f3ebb786 1073int p = g->ptr;
acec9514 1074int oldsize = g->size;
f3ebb786 1075BOOL tainted = is_tainted(g->s);
acec9514
JH
1076
1077/* Mostly, string_cat() is used to build small strings of a few hundred
1078characters at most. There are times, however, when the strings are very much
1079longer (for example, a lookup that returns a vast number of alias addresses).
1080To try to keep things reasonable, we use increments whose size depends on the
1081existing length of the string. */
1082
1083unsigned inc = oldsize < 4096 ? 127 : 1023;
f3ebb786
JH
1084
1085if (count <= 0) return;
1086g->size = (p + count + inc + 1) & ~inc; /* one for a NUL */
acec9514
JH
1087
1088/* Try to extend an existing allocation. If the result of calling
1089store_extend() is false, either there isn't room in the current memory block,
1090or this string is not the top item on the dynamic store stack. We then have
1091to get a new chunk of store and copy the old string. When building large
1092strings, it is helpful to call store_release() on the old string, to release
1093memory blocks that have become empty. (The block will be freed if the string
1094is at its start.) However, we can do this only if we know that the old string
1095was the last item on the dynamic memory stack. This is the case if it matches
1096store_last_get. */
1097
f3ebb786
JH
1098if (!store_extend(g->s, tainted, oldsize, g->size))
1099 g->s = store_newblock(g->s, tainted, g->size, p);
acec9514
JH
1100}
1101
1102
1103
d12746bc
JH
1104/*************************************************
1105* Add chars to string *
1106*************************************************/
059ec3d9
PH
1107/* This function is used when building up strings of unknown length. Room is
1108always left for a terminating zero to be added to the string that is being
1109built. This function does not require the string that is being added to be NUL
1110terminated, because the number of characters to add is given explicitly. It is
1111sometimes called to extract parts of other strings.
1112
1113Arguments:
1114 string points to the start of the string that is being built, or NULL
1115 if this is a new string that has no contents yet
059ec3d9
PH
1116 s points to characters to add
1117 count count of characters to add; must not exceed the length of s, if s
42055a33 1118 is a C string.
059ec3d9 1119
059ec3d9
PH
1120Returns: pointer to the start of the string, changed if copied for expansion.
1121 Note that a NUL is not added, though space is left for one. This is
1122 because string_cat() is often called multiple times to build up a
1123 string - there's no point adding the NUL till the end.
a1b8a755 1124
059ec3d9 1125*/
96f5fe4c 1126/* coverity[+alloc] */
059ec3d9 1127
acec9514
JH
1128gstring *
1129string_catn(gstring * g, const uschar *s, int count)
059ec3d9 1130{
acec9514 1131int p;
f3ebb786 1132BOOL srctaint = is_tainted(s);
059ec3d9 1133
acec9514 1134if (!g)
059ec3d9 1135 {
acec9514
JH
1136 unsigned inc = count < 4096 ? 127 : 1023;
1137 unsigned size = ((count + inc) & ~inc) + 1;
f3ebb786 1138 g = string_get_tainted(size, srctaint);
059ec3d9 1139 }
f3ebb786
JH
1140else if (srctaint && !is_tainted(g->s))
1141 gstring_rebuffer(g);
059ec3d9 1142
acec9514
JH
1143p = g->ptr;
1144if (p + count >= g->size)
f3ebb786 1145 gstring_grow(g, count);
acec9514 1146
059ec3d9
PH
1147/* Because we always specify the exact number of characters to copy, we can
1148use memcpy(), which is likely to be more efficient than strncopy() because the
acec9514 1149latter has to check for zero bytes. */
059ec3d9 1150
acec9514
JH
1151memcpy(g->s + p, s, count);
1152g->ptr = p + count;
1153return g;
059ec3d9 1154}
c3aefacc
HSHR
1155
1156
acec9514
JH
1157gstring *
1158string_cat(gstring *string, const uschar *s)
c2f669a4 1159{
acec9514 1160return string_catn(string, s, Ustrlen(s));
c2f669a4 1161}
059ec3d9
PH
1162
1163
1164
059ec3d9
PH
1165/*************************************************
1166* Append strings to another string *
1167*************************************************/
1168
1169/* This function can be used to build a string from many other strings.
1170It calls string_cat() to do the dirty work.
1171
1172Arguments:
acec9514 1173 string expanding-string that is being built, or NULL
059ec3d9 1174 if this is a new string that has no contents yet
059ec3d9
PH
1175 count the number of strings to append
1176 ... "count" uschar* arguments, which must be valid zero-terminated
1177 C strings
1178
1179Returns: pointer to the start of the string, changed if copied for expansion.
1180 The string is not zero-terminated - see string_cat() above.
1181*/
1182
acec9514
JH
1183__inline__ gstring *
1184string_append(gstring *string, int count, ...)
059ec3d9
PH
1185{
1186va_list ap;
059ec3d9
PH
1187
1188va_start(ap, count);
acec9514 1189while (count-- > 0)
059ec3d9
PH
1190 {
1191 uschar *t = va_arg(ap, uschar *);
acec9514 1192 string = string_cat(string, t);
059ec3d9
PH
1193 }
1194va_end(ap);
1195
1196return string;
1197}
1198#endif
1199
1200
1201
1202/*************************************************
1203* Format a string with length checks *
1204*************************************************/
1205
1206/* This function is used to format a string with checking of the length of the
1207output for all conversions. It protects Exim from absent-mindedness when
1208calling functions like debug_printf and string_sprintf, and elsewhere. There
1209are two different entry points to what is actually the same function, depending
1210on whether the variable length list of data arguments are given explicitly or
1211as a va_list item.
1212
1213The formats are the usual printf() ones, with some omissions (never used) and
c0b9d3e8 1214three additions for strings: %S forces lower case, %T forces upper case, and
acec9514 1215%#s or %#S prints nothing for a NULL string. Without the # "NULL" is printed
c0b9d3e8
JH
1216(useful in debugging). There is also the addition of %D and %M, which insert
1217the date in the form used for datestamped log files.
059ec3d9
PH
1218
1219Arguments:
1220 buffer a buffer in which to put the formatted string
1221 buflen the length of the buffer
1222 format the format string - deliberately char * and not uschar *
1223 ... or ap variable list of supplementary arguments
1224
1225Returns: TRUE if the result fitted in the buffer
1226*/
1227
1228BOOL
f3ebb786
JH
1229string_format_trc(uschar * buffer, int buflen,
1230 const uschar * func, unsigned line, const char * format, ...)
059ec3d9 1231{
d12746bc 1232gstring g = { .size = buflen, .ptr = 0, .s = buffer }, *gp;
059ec3d9
PH
1233va_list ap;
1234va_start(ap, format);
f3ebb786
JH
1235gp = string_vformat_trc(&g, func, line, STRING_SPRINTF_BUFFER_SIZE,
1236 0, format, ap);
059ec3d9 1237va_end(ap);
d12746bc
JH
1238g.s[g.ptr] = '\0';
1239return !!gp;
059ec3d9
PH
1240}
1241
1242
d12746bc 1243
d12746bc 1244
f3ebb786 1245/* Build or append to a growing-string, sprintf-style.
d12746bc 1246
b273058b
JH
1247Arguments:
1248 g a growable-string
1249 func called-from function name, for debug
1250 line called-from file line number, for debug
1251 limit maximum string size
1252 flags see below
1253 format printf-like format string
1254 ap variable-args pointer
1255
1256Flags:
1257 SVFMT_EXTEND buffer can be created or exteded as needed
1258 SVFMT_REBUFFER buffer can be recopied to tainted mem as needed
1259 SVFMT_TAINT_NOCHK do not check inputs for taint
1260
f3ebb786
JH
1261If the "extend" flag is true, the string passed in can be NULL,
1262empty, or non-empty. Growing is subject to an overall limit given
b273058b 1263by the limit argument.
d12746bc 1264
f3ebb786 1265If the "extend" flag is false, the string passed in may not be NULL,
d12746bc
JH
1266will not be grown, and is usable in the original place after return.
1267The return value can be NULL to signify overflow.
1268
adc4ecf9
JH
1269Returns the possibly-new (if copy for growth or taint-handling was needed)
1270string, not nul-terminated.
d12746bc
JH
1271*/
1272
1273gstring *
f3ebb786
JH
1274string_vformat_trc(gstring * g, const uschar * func, unsigned line,
1275 unsigned size_limit, unsigned flags, const char *format, va_list ap)
059ec3d9 1276{
d12746bc
JH
1277enum ltypes { L_NORMAL=1, L_SHORT=2, L_LONG=3, L_LONGLONG=4, L_LONGDOUBLE=5, L_SIZE=6 };
1278
f3ebb786 1279int width, precision, off, lim, need;
d12746bc 1280const char * fp = format; /* Deliberately not unsigned */
f3ebb786 1281BOOL dest_tainted = FALSE;
b1c749bb 1282
d12746bc
JH
1283string_datestamp_offset = -1; /* Datestamp not inserted */
1284string_datestamp_length = 0; /* Datestamp not inserted */
1285string_datestamp_type = 0; /* Datestamp not inserted */
059ec3d9 1286
d12746bc 1287#ifdef COMPILE_UTILITY
f3ebb786 1288assert(!(flags & SVFMT_EXTEND));
d12746bc
JH
1289assert(g);
1290#else
1291
1292/* Ensure we have a string, to save on checking later */
1293if (!g) g = string_get(16);
f3ebb786
JH
1294else if (!(flags & SVFMT_TAINT_NOCHK)) dest_tainted = is_tainted(g->s);
1295
1296if (!(flags & SVFMT_TAINT_NOCHK) && !dest_tainted && is_tainted(format))
1297 {
aaabfafe 1298#ifndef MACRO_PREDEF
f3ebb786
JH
1299 if (!(flags & SVFMT_REBUFFER))
1300 die_tainted(US"string_vformat", func, line);
aaabfafe 1301#endif
f3ebb786
JH
1302 gstring_rebuffer(g);
1303 dest_tainted = TRUE;
1304 }
d12746bc
JH
1305#endif /*!COMPILE_UTILITY*/
1306
1307lim = g->size - 1; /* leave one for a nul */
1308off = g->ptr; /* remember initial offset in gstring */
059ec3d9
PH
1309
1310/* Scan the format and handle the insertions */
1311
d12746bc 1312while (*fp)
059ec3d9 1313 {
b1c749bb 1314 int length = L_NORMAL;
059ec3d9
PH
1315 int *nptr;
1316 int slen;
d12746bc
JH
1317 const char *null = "NULL"; /* ) These variables */
1318 const char *item_start, *s; /* ) are deliberately */
1319 char newformat[16]; /* ) not unsigned */
1320 char * gp = CS g->s + g->ptr; /* ) */
059ec3d9
PH
1321
1322 /* Non-% characters just get copied verbatim */
1323
1324 if (*fp != '%')
1325 {
d12746bc 1326 /* Avoid string_copyn() due to COMPILE_UTILITY */
f3ebb786 1327 if ((need = g->ptr + 1) > lim)
1100a343 1328 {
f3ebb786
JH
1329 if (!(flags & SVFMT_EXTEND) || need > size_limit) return NULL;
1330 gstring_grow(g, 1);
1100a343
JH
1331 lim = g->size - 1;
1332 }
d12746bc 1333 g->s[g->ptr++] = (uschar) *fp++;
059ec3d9
PH
1334 continue;
1335 }
1336
1337 /* Deal with % characters. Pick off the width and precision, for checking
1338 strings, skipping over the flag and modifier characters. */
1339
1340 item_start = fp;
1341 width = precision = -1;
1342
1343 if (strchr("-+ #0", *(++fp)) != NULL)
1344 {
1345 if (*fp == '#') null = "";
1346 fp++;
1347 }
1348
1349 if (isdigit((uschar)*fp))
1350 {
1351 width = *fp++ - '0';
1352 while (isdigit((uschar)*fp)) width = width * 10 + *fp++ - '0';
1353 }
1354 else if (*fp == '*')
1355 {
1356 width = va_arg(ap, int);
1357 fp++;
1358 }
1359
1360 if (*fp == '.')
059ec3d9
PH
1361 if (*(++fp) == '*')
1362 {
1363 precision = va_arg(ap, int);
1364 fp++;
1365 }
1366 else
d12746bc
JH
1367 for (precision = 0; isdigit((uschar)*fp); fp++)
1368 precision = precision*10 + *fp - '0';
059ec3d9 1369
91a246f6 1370 /* Skip over 'h', 'L', 'l', 'll' and 'z', remembering the item length */
b1c749bb
PH
1371
1372 if (*fp == 'h')
1373 { fp++; length = L_SHORT; }
1374 else if (*fp == 'L')
1375 { fp++; length = L_LONGDOUBLE; }
1376 else if (*fp == 'l')
b1c749bb 1377 if (fp[1] == 'l')
d12746bc 1378 { fp += 2; length = L_LONGLONG; }
b1c749bb 1379 else
d12746bc 1380 { fp++; length = L_LONG; }
91a246f6
PP
1381 else if (*fp == 'z')
1382 { fp++; length = L_SIZE; }
059ec3d9
PH
1383
1384 /* Handle each specific format type. */
1385
1386 switch (*fp++)
1387 {
1388 case 'n':
d12746bc
JH
1389 nptr = va_arg(ap, int *);
1390 *nptr = g->ptr - off;
1391 break;
059ec3d9
PH
1392
1393 case 'd':
1394 case 'o':
1395 case 'u':
1396 case 'x':
1397 case 'X':
d12746bc 1398 width = length > L_LONG ? 24 : 12;
f3ebb786 1399 if ((need = g->ptr + width) > lim)
1100a343 1400 {
f3ebb786
JH
1401 if (!(flags & SVFMT_EXTEND) || need >= size_limit) return NULL;
1402 gstring_grow(g, width);
1100a343
JH
1403 lim = g->size - 1;
1404 gp = CS g->s + g->ptr;
1405 }
d12746bc
JH
1406 strncpy(newformat, item_start, fp - item_start);
1407 newformat[fp - item_start] = 0;
b1c749bb 1408
d12746bc
JH
1409 /* Short int is promoted to int when passing through ..., so we must use
1410 int for va_arg(). */
b1c749bb 1411
d12746bc
JH
1412 switch(length)
1413 {
1414 case L_SHORT:
1415 case L_NORMAL:
1416 g->ptr += sprintf(gp, newformat, va_arg(ap, int)); break;
1417 case L_LONG:
1418 g->ptr += sprintf(gp, newformat, va_arg(ap, long int)); break;
1419 case L_LONGLONG:
1420 g->ptr += sprintf(gp, newformat, va_arg(ap, LONGLONG_T)); break;
1421 case L_SIZE:
1422 g->ptr += sprintf(gp, newformat, va_arg(ap, size_t)); break;
1423 }
1424 break;
059ec3d9
PH
1425
1426 case 'p':
2e8db779
JH
1427 {
1428 void * ptr;
f3ebb786 1429 if ((need = g->ptr + 24) > lim)
1100a343 1430 {
f3ebb786
JH
1431 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1432 gstring_grow(g, 24);
1100a343
JH
1433 lim = g->size - 1;
1434 gp = CS g->s + g->ptr;
1435 }
81f358da
JH
1436 /* sprintf() saying "(nil)" for a null pointer seems unreliable.
1437 Handle it explicitly. */
2e8db779
JH
1438 if ((ptr = va_arg(ap, void *)))
1439 {
1440 strncpy(newformat, item_start, fp - item_start);
1441 newformat[fp - item_start] = 0;
d12746bc 1442 g->ptr += sprintf(gp, newformat, ptr);
2e8db779
JH
1443 }
1444 else
d12746bc 1445 g->ptr += sprintf(gp, "(nil)");
2e8db779 1446 }
059ec3d9
PH
1447 break;
1448
1449 /* %f format is inherently insecure if the numbers that it may be
870f6ba8
TF
1450 handed are unknown (e.g. 1e300). However, in Exim, %f is used for
1451 printing load averages, and these are actually stored as integers
1452 (load average * 1000) so the size of the numbers is constrained.
1453 It is also used for formatting sending rates, where the simplicity
1454 of the format prevents overflow. */
059ec3d9
PH
1455
1456 case 'f':
1457 case 'e':
1458 case 'E':
1459 case 'g':
1460 case 'G':
d12746bc 1461 if (precision < 0) precision = 6;
f3ebb786 1462 if ((need = g->ptr + precision + 8) > lim)
1100a343 1463 {
f3ebb786
JH
1464 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1465 gstring_grow(g, precision+8);
1100a343
JH
1466 lim = g->size - 1;
1467 gp = CS g->s + g->ptr;
1468 }
d12746bc
JH
1469 strncpy(newformat, item_start, fp - item_start);
1470 newformat[fp-item_start] = 0;
1471 if (length == L_LONGDOUBLE)
1472 g->ptr += sprintf(gp, newformat, va_arg(ap, long double));
1473 else
1474 g->ptr += sprintf(gp, newformat, va_arg(ap, double));
1475 break;
059ec3d9
PH
1476
1477 /* String types */
1478
1479 case '%':
f3ebb786 1480 if ((need = g->ptr + 1) > lim)
1100a343 1481 {
f3ebb786
JH
1482 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1483 gstring_grow(g, 1);
1100a343
JH
1484 lim = g->size - 1;
1485 }
d12746bc
JH
1486 g->s[g->ptr++] = (uschar) '%';
1487 break;
059ec3d9
PH
1488
1489 case 'c':
f3ebb786 1490 if ((need = g->ptr + 1) > lim)
1100a343 1491 {
f3ebb786
JH
1492 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1493 gstring_grow(g, 1);
1100a343
JH
1494 lim = g->size - 1;
1495 }
d12746bc
JH
1496 g->s[g->ptr++] = (uschar) va_arg(ap, int);
1497 break;
059ec3d9 1498
f1e5fef5 1499 case 'D': /* Insert daily datestamp for log file names */
d12746bc
JH
1500 s = CS tod_stamp(tod_log_datestamp_daily);
1501 string_datestamp_offset = g->ptr; /* Passed back via global */
1502 string_datestamp_length = Ustrlen(s); /* Passed back via global */
1503 string_datestamp_type = tod_log_datestamp_daily;
1504 slen = string_datestamp_length;
1505 goto INSERT_STRING;
f1e5fef5
PP
1506
1507 case 'M': /* Insert monthly datestamp for log file names */
d12746bc
JH
1508 s = CS tod_stamp(tod_log_datestamp_monthly);
1509 string_datestamp_offset = g->ptr; /* Passed back via global */
1510 string_datestamp_length = Ustrlen(s); /* Passed back via global */
1511 string_datestamp_type = tod_log_datestamp_monthly;
1512 slen = string_datestamp_length;
1513 goto INSERT_STRING;
059ec3d9
PH
1514
1515 case 's':
1516 case 'S': /* Forces *lower* case */
c0b9d3e8 1517 case 'T': /* Forces *upper* case */
d12746bc 1518 s = va_arg(ap, char *);
059ec3d9 1519
d12746bc
JH
1520 if (!s) s = null;
1521 slen = Ustrlen(s);
059ec3d9 1522
f3ebb786
JH
1523 if (!(flags & SVFMT_TAINT_NOCHK) && !dest_tainted && is_tainted(s))
1524 if (flags & SVFMT_REBUFFER)
1525 {
1526 gstring_rebuffer(g);
1527 gp = CS g->s + g->ptr;
1528 dest_tainted = TRUE;
1529 }
aaabfafe 1530#ifndef MACRO_PREDEF
f3ebb786
JH
1531 else
1532 die_tainted(US"string_vformat", func, line);
aaabfafe 1533#endif
f3ebb786 1534
f1e5fef5
PP
1535 INSERT_STRING: /* Come to from %D or %M above */
1536
059ec3d9 1537 {
d12746bc 1538 BOOL truncated = FALSE;
059ec3d9 1539
d12746bc
JH
1540 /* If the width is specified, check that there is a precision
1541 set; if not, set it to the width to prevent overruns of long
1542 strings. */
059ec3d9 1543
d12746bc
JH
1544 if (width >= 0)
1545 {
1546 if (precision < 0) precision = width;
1547 }
059ec3d9 1548
d12746bc
JH
1549 /* If a width is not specified and the precision is specified, set
1550 the width to the precision, or the string length if shorted. */
059ec3d9 1551
d12746bc
JH
1552 else if (precision >= 0)
1553 width = precision < slen ? precision : slen;
059ec3d9 1554
d12746bc 1555 /* If neither are specified, set them both to the string length. */
059ec3d9 1556
d12746bc
JH
1557 else
1558 width = precision = slen;
1559
f3ebb786 1560 if ((need = g->ptr + width) >= size_limit || !(flags & SVFMT_EXTEND))
d12746bc
JH
1561 {
1562 if (g->ptr == lim) return NULL;
f3ebb786 1563 if (need > lim)
d12746bc
JH
1564 {
1565 truncated = TRUE;
1566 width = precision = lim - g->ptr - 1;
1567 if (width < 0) width = 0;
1568 if (precision < 0) precision = 0;
1569 }
1570 }
f3ebb786 1571 else if (need > lim)
1100a343 1572 {
f3ebb786 1573 gstring_grow(g, width);
1100a343
JH
1574 lim = g->size - 1;
1575 gp = CS g->s + g->ptr;
1576 }
d12746bc
JH
1577
1578 g->ptr += sprintf(gp, "%*.*s", width, precision, s);
1579 if (fp[-1] == 'S')
1580 while (*gp) { *gp = tolower(*gp); gp++; }
1581 else if (fp[-1] == 'T')
1582 while (*gp) { *gp = toupper(*gp); gp++; }
1583
1584 if (truncated) return NULL;
1585 break;
059ec3d9 1586 }
059ec3d9
PH
1587
1588 /* Some things are never used in Exim; also catches junk. */
1589
1590 default:
d12746bc
JH
1591 strncpy(newformat, item_start, fp - item_start);
1592 newformat[fp-item_start] = 0;
1593 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "string_format: unsupported type "
1594 "in \"%s\" in \"%s\"", newformat, format);
1595 break;
059ec3d9
PH
1596 }
1597 }
1598
f3ebb786
JH
1599if (g->ptr > g->size)
1600 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
1601 "string_format internal error: caller %s %d", func, line);
d12746bc
JH
1602return g;
1603}
059ec3d9 1604
059ec3d9 1605
d12746bc
JH
1606
1607#ifndef COMPILE_UTILITY
059ec3d9
PH
1608/*************************************************
1609* Generate an "open failed" message *
1610*************************************************/
1611
1612/* This function creates a message after failure to open a file. It includes a
1613string supplied as data, adds the strerror() text, and if the failure was
1614"Permission denied", reads and includes the euid and egid.
1615
1616Arguments:
1617 eno the value of errno after the failure
1618 format a text format string - deliberately not uschar *
1619 ... arguments for the format string
1620
1621Returns: a message, in dynamic store
1622*/
1623
1624uschar *
f3ebb786
JH
1625string_open_failed_trc(int eno, const uschar * func, unsigned line,
1626 const char *format, ...)
059ec3d9
PH
1627{
1628va_list ap;
d12746bc 1629gstring * g = string_get(1024);
059ec3d9 1630
d12746bc 1631g = string_catn(g, US"failed to open ", 15);
059ec3d9
PH
1632
1633/* Use the checked formatting routine to ensure that the buffer
1634does not overflow. It should not, since this is called only for internally
1635specified messages. If it does, the message just gets truncated, and there
1636doesn't seem much we can do about that. */
1637
d12746bc 1638va_start(ap, format);
f3ebb786 1639(void) string_vformat_trc(g, func, line, STRING_SPRINTF_BUFFER_SIZE,
ba74fb8d 1640 SVFMT_REBUFFER, format, ap);
d12746bc 1641string_from_gstring(g);
e59797e3 1642gstring_release_unused(g);
cb570b5e 1643va_end(ap);
059ec3d9 1644
d12746bc
JH
1645return eno == EACCES
1646 ? string_sprintf("%s: %s (euid=%ld egid=%ld)", g->s, strerror(eno),
1647 (long int)geteuid(), (long int)getegid())
1648 : string_sprintf("%s: %s", g->s, strerror(eno));
059ec3d9
PH
1649}
1650#endif /* COMPILE_UTILITY */
1651
1652
1653
059ec3d9
PH
1654
1655
bc3c7bb7
HSHR
1656#ifndef COMPILE_UTILITY
1657/* qsort(3), currently used to sort the environment variables
1658for -bP environment output, needs a function to compare two pointers to string
1659pointers. Here it is. */
1660
1661int
84bbb4d8 1662string_compare_by_pointer(const void *a, const void *b)
bc3c7bb7 1663{
35a5627d 1664return Ustrcmp(* CUSS a, * CUSS b);
bc3c7bb7
HSHR
1665}
1666#endif /* COMPILE_UTILITY */
059ec3d9
PH
1667
1668
1669
d12746bc 1670
059ec3d9
PH
1671/*************************************************
1672**************************************************
1673* Stand-alone test program *
1674**************************************************
1675*************************************************/
1676
1677#ifdef STAND_ALONE
1678int main(void)
1679{
1680uschar buffer[256];
1681
1682printf("Testing is_ip_address\n");
1683
1684while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1685 {
1686 int offset;
1687 buffer[Ustrlen(buffer) - 1] = 0;
1688 printf("%d\n", string_is_ip_address(buffer, NULL));
1689 printf("%d %d %s\n", string_is_ip_address(buffer, &offset), offset, buffer);
1690 }
1691
1692printf("Testing string_nextinlist\n");
1693
1694while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1695 {
1696 uschar *list = buffer;
1697 uschar *lp1, *lp2;
1698 uschar item[256];
1699 int sep1 = 0;
1700 int sep2 = 0;
1701
1702 if (*list == '<')
1703 {
1704 sep1 = sep2 = list[1];
1705 list += 2;
1706 }
1707
1708 lp1 = lp2 = list;
1709 for (;;)
1710 {
1711 uschar *item1 = string_nextinlist(&lp1, &sep1, item, sizeof(item));
1712 uschar *item2 = string_nextinlist(&lp2, &sep2, NULL, 0);
1713
1714 if (item1 == NULL && item2 == NULL) break;
1715 if (item == NULL || item2 == NULL || Ustrcmp(item1, item2) != 0)
1716 {
1717 printf("***ERROR\nitem1=\"%s\"\nitem2=\"%s\"\n",
1718 (item1 == NULL)? "NULL" : CS item1,
1719 (item2 == NULL)? "NULL" : CS item2);
1720 break;
1721 }
1722 else printf(" \"%s\"\n", CS item1);
1723 }
1724 }
1725
1726/* This is a horrible lash-up, but it serves its purpose. */
1727
1728printf("Testing string_format\n");
1729
1730while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1731 {
1732 void *args[3];
ed72ace5 1733 long long llargs[3];
059ec3d9
PH
1734 double dargs[3];
1735 int dflag = 0;
ed72ace5 1736 int llflag = 0;
059ec3d9
PH
1737 int n = 0;
1738 int count;
1739 int countset = 0;
1740 uschar format[256];
1741 uschar outbuf[256];
1742 uschar *s;
1743 buffer[Ustrlen(buffer) - 1] = 0;
1744
1745 s = Ustrchr(buffer, ',');
1746 if (s == NULL) s = buffer + Ustrlen(buffer);
1747
1748 Ustrncpy(format, buffer, s - buffer);
1749 format[s-buffer] = 0;
1750
1751 if (*s == ',') s++;
1752
1753 while (*s != 0)
1754 {
1755 uschar *ss = s;
1756 s = Ustrchr(ss, ',');
1757 if (s == NULL) s = ss + Ustrlen(ss);
1758
1759 if (isdigit(*ss))
1760 {
1761 Ustrncpy(outbuf, ss, s-ss);
1762 if (Ustrchr(outbuf, '.') != NULL)
1763 {
1764 dflag = 1;
1765 dargs[n++] = Ustrtod(outbuf, NULL);
1766 }
ed72ace5
PH
1767 else if (Ustrstr(outbuf, "ll") != NULL)
1768 {
1769 llflag = 1;
1770 llargs[n++] = strtoull(CS outbuf, NULL, 10);
1771 }
059ec3d9
PH
1772 else
1773 {
1774 args[n++] = (void *)Uatoi(outbuf);
1775 }
1776 }
1777
1778 else if (Ustrcmp(ss, "*") == 0)
1779 {
1780 args[n++] = (void *)(&count);
1781 countset = 1;
1782 }
1783
1784 else
1785 {
1786 uschar *sss = malloc(s - ss + 1);
1787 Ustrncpy(sss, ss, s-ss);
1788 args[n++] = sss;
1789 }
1790
1791 if (*s == ',') s++;
1792 }
1793
ed72ace5
PH
1794 if (!dflag && !llflag)
1795 printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
1796 args[0], args[1], args[2])? "True" : "False");
1797
1798 else if (dflag)
1799 printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
1800 dargs[0], dargs[1], dargs[2])? "True" : "False");
059ec3d9
PH
1801
1802 else printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
ed72ace5 1803 llargs[0], llargs[1], llargs[2])? "True" : "False");
059ec3d9
PH
1804
1805 printf("%s\n", CS outbuf);
1806 if (countset) printf("count=%d\n", count);
1807 }
1808
1809return 0;
1810}
1811#endif
1812
1813/* End of string.c */