Revert "GnuTLS: remove GNUTLS_E_AGAIN handling"
[exim.git] / src / src / string.c
CommitLineData
059ec3d9
PH
1/*************************************************
2* Exim - an Internet mail transport agent *
3*************************************************/
4
f9ba5e22 5/* Copyright (c) University of Cambridge 1995 - 2018 */
059ec3d9
PH
6/* See the file NOTICE for conditions of use and distribution. */
7
8/* Miscellaneous string-handling functions. Some are not required for
9utilities and tests, and are cut out by the COMPILE_UTILITY macro. */
10
11
12#include "exim.h"
d12746bc 13#include <assert.h>
059ec3d9 14
f3ebb786 15static void gstring_rebuffer(gstring * g);
059ec3d9
PH
16
17#ifndef COMPILE_UTILITY
18/*************************************************
19* Test for IP address *
20*************************************************/
21
22/* This used just to be a regular expression, but with IPv6 things are a bit
23more complicated. If the address contains a colon, it is assumed to be a v6
24address (assuming HAVE_IPV6 is set). If a mask is permitted and one is present,
25and maskptr is not NULL, its offset is placed there.
26
27Arguments:
28 s a string
29 maskptr NULL if no mask is permitted to follow
30 otherwise, points to an int where the offset of '/' is placed
1688f43b 31 if there is no / followed by trailing digits, *maskptr is set 0
059ec3d9
PH
32
33Returns: 0 if the string is not a textual representation of an IP address
34 4 if it is an IPv4 address
35 6 if it is an IPv6 address
36*/
37
38int
b1f8e4f8 39string_is_ip_address(const uschar *s, int *maskptr)
059ec3d9 40{
059ec3d9
PH
41int yield = 4;
42
43/* If an optional mask is permitted, check for it. If found, pass back the
44offset. */
45
8d909960 46if (maskptr)
059ec3d9 47 {
b1f8e4f8 48 const uschar *ss = s + Ustrlen(s);
059ec3d9
PH
49 *maskptr = 0;
50 if (s != ss && isdigit(*(--ss)))
51 {
52 while (ss > s && isdigit(ss[-1])) ss--;
53 if (ss > s && *(--ss) == '/') *maskptr = ss - s;
54 }
55 }
56
57/* A colon anywhere in the string => IPv6 address */
58
59if (Ustrchr(s, ':') != NULL)
60 {
61 BOOL had_double_colon = FALSE;
62 BOOL v4end = FALSE;
059ec3d9
PH
63
64 yield = 6;
65
66 /* An IPv6 address must start with hex digit or double colon. A single
67 colon is invalid. */
68
69 if (*s == ':' && *(++s) != ':') return 0;
70
71 /* Now read up to 8 components consisting of up to 4 hex digits each. There
72 may be one and only one appearance of double colon, which implies any number
73 of binary zero bits. The number of preceding components is held in count. */
74
d7978c0f 75 for (int count = 0; count < 8; count++)
059ec3d9
PH
76 {
77 /* If the end of the string is reached before reading 8 components, the
78 address is valid provided a double colon has been read. This also applies
79 if we hit the / that introduces a mask or the % that introduces the
80 interface specifier (scope id) of a link-local address. */
81
8d909960 82 if (*s == 0 || *s == '%' || *s == '/') return had_double_colon ? yield : 0;
059ec3d9
PH
83
84 /* If a component starts with an additional colon, we have hit a double
85 colon. This is permitted to appear once only, and counts as at least
86 one component. The final component may be of this form. */
87
88 if (*s == ':')
89 {
90 if (had_double_colon) return 0;
91 had_double_colon = TRUE;
92 s++;
93 continue;
94 }
95
96 /* If the remainder of the string contains a dot but no colons, we
97 can expect a trailing IPv4 address. This is valid if either there has
98 been no double-colon and this is the 7th component (with the IPv4 address
99 being the 7th & 8th components), OR if there has been a double-colon
100 and fewer than 6 components. */
101
102 if (Ustrchr(s, ':') == NULL && Ustrchr(s, '.') != NULL)
103 {
104 if ((!had_double_colon && count != 6) ||
105 (had_double_colon && count > 6)) return 0;
106 v4end = TRUE;
107 yield = 6;
108 break;
109 }
110
111 /* Check for at least one and not more than 4 hex digits for this
112 component. */
113
114 if (!isxdigit(*s++)) return 0;
115 if (isxdigit(*s) && isxdigit(*(++s)) && isxdigit(*(++s))) s++;
116
117 /* If the component is terminated by colon and there is more to
118 follow, skip over the colon. If there is no more to follow the address is
119 invalid. */
120
121 if (*s == ':' && *(++s) == 0) return 0;
122 }
123
124 /* If about to handle a trailing IPv4 address, drop through. Otherwise
125 all is well if we are at the end of the string or at the mask or at a percent
126 sign, which introduces the interface specifier (scope id) of a link local
127 address. */
128
1688f43b
PH
129 if (!v4end)
130 return (*s == 0 || *s == '%' ||
131 (*s == '/' && maskptr != NULL && *maskptr != 0))? yield : 0;
059ec3d9
PH
132 }
133
134/* Test for IPv4 address, which may be the tail-end of an IPv6 address. */
135
d7978c0f 136for (int i = 0; i < 4; i++)
059ec3d9 137 {
8d909960
JH
138 long n;
139 uschar * end;
140
059ec3d9 141 if (i != 0 && *s++ != '.') return 0;
8d909960
JH
142 n = strtol(CCS s, CSS &end, 10);
143 if (n > 255 || n < 0 || end <= s || end > s+3) return 0;
144 s = end;
059ec3d9
PH
145 }
146
8d909960 147return !*s || (*s == '/' && maskptr && *maskptr != 0) ? yield : 0;
059ec3d9
PH
148}
149#endif /* COMPILE_UTILITY */
150
151
152/*************************************************
153* Format message size *
154*************************************************/
155
156/* Convert a message size in bytes to printing form, rounding
157according to the magnitude of the number. A value of zero causes
158a string of spaces to be returned.
159
160Arguments:
161 size the message size in bytes
162 buffer where to put the answer
163
164Returns: pointer to the buffer
165 a string of exactly 5 characters is normally returned
166*/
167
168uschar *
169string_format_size(int size, uschar *buffer)
170{
f3ebb786 171if (size == 0) Ustrcpy(buffer, US" ");
059ec3d9
PH
172else if (size < 1024) sprintf(CS buffer, "%5d", size);
173else if (size < 10*1024)
174 sprintf(CS buffer, "%4.1fK", (double)size / 1024.0);
175else if (size < 1024*1024)
176 sprintf(CS buffer, "%4dK", (size + 512)/1024);
177else if (size < 10*1024*1024)
178 sprintf(CS buffer, "%4.1fM", (double)size / (1024.0 * 1024.0));
179else
180 sprintf(CS buffer, "%4dM", (size + 512 * 1024)/(1024*1024));
181return buffer;
182}
183
184
185
186#ifndef COMPILE_UTILITY
187/*************************************************
188* Convert a number to base 62 format *
189*************************************************/
190
191/* Convert a long integer into an ASCII base 62 string. For Cygwin the value of
192BASE_62 is actually 36. Always return exactly 6 characters plus zero, in a
193static area.
194
195Argument: a long integer
196Returns: pointer to base 62 string
197*/
198
199uschar *
200string_base62(unsigned long int value)
201{
202static uschar yield[7];
203uschar *p = yield + sizeof(yield) - 1;
204*p = 0;
205while (p > yield)
206 {
207 *(--p) = base62_chars[value % BASE_62];
208 value /= BASE_62;
209 }
210return yield;
211}
212#endif /* COMPILE_UTILITY */
213
214
215
059ec3d9
PH
216/*************************************************
217* Interpret escape sequence *
218*************************************************/
219
220/* This function is called from several places where escape sequences are to be
221interpreted in strings.
222
223Arguments:
224 pp points a pointer to the initiating "\" in the string;
225 the pointer gets updated to point to the final character
c3aefacc
HSHR
226 If the backslash is the last character in the string, it
227 is not interpreted.
059ec3d9
PH
228Returns: the value of the character escape
229*/
230
231int
55414b25 232string_interpret_escape(const uschar **pp)
059ec3d9 233{
3fb3c68d
JH
234#ifdef COMPILE_UTILITY
235const uschar *hex_digits= CUS"0123456789abcdef";
236#endif
059ec3d9 237int ch;
55414b25 238const uschar *p = *pp;
059ec3d9 239ch = *(++p);
c3aefacc 240if (ch == '\0') return **pp;
059ec3d9
PH
241if (isdigit(ch) && ch != '8' && ch != '9')
242 {
243 ch -= '0';
244 if (isdigit(p[1]) && p[1] != '8' && p[1] != '9')
245 {
246 ch = ch * 8 + *(++p) - '0';
247 if (isdigit(p[1]) && p[1] != '8' && p[1] != '9')
248 ch = ch * 8 + *(++p) - '0';
249 }
250 }
251else switch(ch)
252 {
c7396ac5
PP
253 case 'b': ch = '\b'; break;
254 case 'f': ch = '\f'; break;
059ec3d9
PH
255 case 'n': ch = '\n'; break;
256 case 'r': ch = '\r'; break;
257 case 't': ch = '\t'; break;
c7396ac5 258 case 'v': ch = '\v'; break;
059ec3d9
PH
259 case 'x':
260 ch = 0;
261 if (isxdigit(p[1]))
262 {
263 ch = ch * 16 +
264 Ustrchr(hex_digits, tolower(*(++p))) - hex_digits;
265 if (isxdigit(p[1])) ch = ch * 16 +
266 Ustrchr(hex_digits, tolower(*(++p))) - hex_digits;
267 }
268 break;
269 }
270*pp = p;
271return ch;
272}
059ec3d9
PH
273
274
275
276#ifndef COMPILE_UTILITY
277/*************************************************
278* Ensure string is printable *
279*************************************************/
280
281/* This function is called for critical strings. It checks for any
282non-printing characters, and if any are found, it makes a new copy
283of the string with suitable escape sequences. It is most often called by the
284macro string_printing(), which sets allow_tab TRUE.
285
286Arguments:
287 s the input string
288 allow_tab TRUE to allow tab as a printing character
289
290Returns: string with non-printers encoded as printing sequences
291*/
292
55414b25
JH
293const uschar *
294string_printing2(const uschar *s, BOOL allow_tab)
059ec3d9
PH
295{
296int nonprintcount = 0;
297int length = 0;
55414b25 298const uschar *t = s;
059ec3d9
PH
299uschar *ss, *tt;
300
301while (*t != 0)
302 {
303 int c = *t++;
304 if (!mac_isprint(c) || (!allow_tab && c == '\t')) nonprintcount++;
305 length++;
306 }
307
308if (nonprintcount == 0) return s;
309
310/* Get a new block of store guaranteed big enough to hold the
311expanded string. */
312
f3ebb786 313ss = store_get(length + nonprintcount * 3 + 1, is_tainted(s));
059ec3d9 314
4c04137d 315/* Copy everything, escaping non printers. */
059ec3d9
PH
316
317t = s;
318tt = ss;
319
320while (*t != 0)
321 {
322 int c = *t;
323 if (mac_isprint(c) && (allow_tab || c != '\t')) *tt++ = *t++; else
324 {
325 *tt++ = '\\';
326 switch (*t)
327 {
328 case '\n': *tt++ = 'n'; break;
329 case '\r': *tt++ = 'r'; break;
330 case '\b': *tt++ = 'b'; break;
331 case '\v': *tt++ = 'v'; break;
332 case '\f': *tt++ = 'f'; break;
333 case '\t': *tt++ = 't'; break;
334 default: sprintf(CS tt, "%03o", *t); tt += 3; break;
335 }
336 t++;
337 }
338 }
339*tt = 0;
c7396ac5
PP
340return ss;
341}
79fe97d8
PP
342#endif /* COMPILE_UTILITY */
343
c7396ac5
PP
344/*************************************************
345* Undo printing escapes in string *
346*************************************************/
347
348/* This function is the reverse of string_printing2. It searches for
349backslash characters and if any are found, it makes a new copy of the
350string with escape sequences parsed. Otherwise it returns the original
351string.
352
353Arguments:
354 s the input string
355
356Returns: string with printing escapes parsed back
357*/
358
359uschar *
360string_unprinting(uschar *s)
361{
362uschar *p, *q, *r, *ss;
363int len, off;
364
365p = Ustrchr(s, '\\');
366if (!p) return s;
367
368len = Ustrlen(s) + 1;
f3ebb786 369ss = store_get(len, is_tainted(s));
c7396ac5
PP
370
371q = ss;
372off = p - s;
373if (off)
374 {
375 memcpy(q, s, off);
376 q += off;
377 }
378
379while (*p)
380 {
381 if (*p == '\\')
382 {
55414b25 383 *q++ = string_interpret_escape((const uschar **)&p);
823ad74f 384 p++;
c7396ac5
PP
385 }
386 else
387 {
388 r = Ustrchr(p, '\\');
389 if (!r)
390 {
391 off = Ustrlen(p);
392 memcpy(q, p, off);
393 p += off;
394 q += off;
395 break;
396 }
397 else
398 {
399 off = r - p;
400 memcpy(q, p, off);
401 q += off;
402 p = r;
403 }
404 }
405 }
406*q = '\0';
407
059ec3d9
PH
408return ss;
409}
059ec3d9
PH
410
411
412
413
bf13aee1
JH
414#if (defined(HAVE_LOCAL_SCAN) || defined(EXPAND_DLFUNC)) \
415 && !defined(MACRO_PREDEF) && !defined(COMPILE_UTILITY)
059ec3d9
PH
416/*************************************************
417* Copy and save string *
418*************************************************/
419
f3ebb786 420/*
059ec3d9 421Argument: string to copy
f3ebb786 422Returns: copy of string in new store with the same taint status
059ec3d9
PH
423*/
424
425uschar *
e59797e3 426string_copy_function(const uschar *s)
059ec3d9 427{
f3ebb786
JH
428return string_copy_taint(s, is_tainted(s));
429}
430
431/* This function assumes that memcpy() is faster than strcpy().
432As above, but explicitly specifying the result taint status
433*/
434
435uschar *
d48326c0 436string_copy_taint_function(const uschar * s, BOOL tainted)
f3ebb786 437{
059ec3d9 438int len = Ustrlen(s) + 1;
f3ebb786 439uschar *ss = store_get(len, tainted);
059ec3d9
PH
440memcpy(ss, s, len);
441return ss;
442}
443
444
f3ebb786 445
059ec3d9
PH
446/*************************************************
447* Copy and save string, given length *
448*************************************************/
449
450/* It is assumed the data contains no zeros. A zero is added
451onto the end.
452
453Arguments:
454 s string to copy
455 n number of characters
456
457Returns: copy of string in new store
458*/
459
460uschar *
e59797e3 461string_copyn_function(const uschar *s, int n)
059ec3d9 462{
f3ebb786 463uschar *ss = store_get(n + 1, is_tainted(s));
059ec3d9
PH
464Ustrncpy(ss, s, n);
465ss[n] = 0;
466return ss;
467}
e59797e3 468#endif
059ec3d9
PH
469
470
471/*************************************************
e59797e3 472* Copy and save string in malloc'd store *
059ec3d9
PH
473*************************************************/
474
e59797e3 475/* This function assumes that memcpy() is faster than strcpy().
059ec3d9 476
e59797e3
JH
477Argument: string to copy
478Returns: copy of string in new store
059ec3d9
PH
479*/
480
481uschar *
e59797e3 482string_copy_malloc(const uschar *s)
059ec3d9 483{
e59797e3
JH
484int len = Ustrlen(s) + 1;
485uschar *ss = store_malloc(len);
486memcpy(ss, s, len);
059ec3d9
PH
487return ss;
488}
489
490
491
e28326d8
PH
492/*************************************************
493* Copy string if long, inserting newlines *
494*************************************************/
495
496/* If the given string is longer than 75 characters, it is copied, and within
497the copy, certain space characters are converted into newlines.
498
499Argument: pointer to the string
500Returns: pointer to the possibly altered string
501*/
502
503uschar *
504string_split_message(uschar *msg)
505{
506uschar *s, *ss;
507
508if (msg == NULL || Ustrlen(msg) <= 75) return msg;
509s = ss = msg = string_copy(msg);
510
511for (;;)
512 {
513 int i = 0;
514 while (i < 75 && *ss != 0 && *ss != '\n') ss++, i++;
515 if (*ss == 0) break;
516 if (*ss == '\n')
517 s = ++ss;
518 else
519 {
520 uschar *t = ss + 1;
521 uschar *tt = NULL;
522 while (--t > s + 35)
523 {
524 if (*t == ' ')
525 {
526 if (t[-1] == ':') { tt = t; break; }
527 if (tt == NULL) tt = t;
528 }
529 }
530
531 if (tt == NULL) /* Can't split behind - try ahead */
532 {
533 t = ss + 1;
534 while (*t != 0)
535 {
536 if (*t == ' ' || *t == '\n')
537 { tt = t; break; }
538 t++;
539 }
540 }
541
542 if (tt == NULL) break; /* Can't find anywhere to split */
543 *tt = '\n';
544 s = ss = tt+1;
545 }
546 }
547
548return msg;
549}
550
551
552
059ec3d9
PH
553/*************************************************
554* Copy returned DNS domain name, de-escaping *
555*************************************************/
556
557/* If a domain name contains top-bit characters, some resolvers return
558the fully qualified name with those characters turned into escapes. The
559convention is a backslash followed by _decimal_ digits. We convert these
560back into the original binary values. This will be relevant when
561allow_utf8_domains is set true and UTF-8 characters are used in domain
562names. Backslash can also be used to escape other characters, though we
563shouldn't come across them in domain names.
564
565Argument: the domain name string
566Returns: copy of string in new store, de-escaped
567*/
568
569uschar *
570string_copy_dnsdomain(uschar *s)
571{
572uschar *yield;
f3ebb786 573uschar *ss = yield = store_get(Ustrlen(s) + 1, is_tainted(s));
059ec3d9
PH
574
575while (*s != 0)
576 {
577 if (*s != '\\')
578 {
579 *ss++ = *s++;
580 }
581 else if (isdigit(s[1]))
582 {
583 *ss++ = (s[1] - '0')*100 + (s[2] - '0')*10 + s[3] - '0';
584 s += 4;
585 }
586 else if (*(++s) != 0)
587 {
588 *ss++ = *s++;
589 }
590 }
591
592*ss = 0;
593return yield;
594}
595
596
597#ifndef COMPILE_UTILITY
598/*************************************************
599* Copy space-terminated or quoted string *
600*************************************************/
601
602/* This function copies from a string until its end, or until whitespace is
603encountered, unless the string begins with a double quote, in which case the
604terminating quote is sought, and escaping within the string is done. The length
605of a de-quoted string can be no longer than the original, since escaping always
606turns n characters into 1 character.
607
608Argument: pointer to the pointer to the first character, which gets updated
609Returns: the new string
610*/
611
612uschar *
55414b25 613string_dequote(const uschar **sptr)
059ec3d9 614{
55414b25 615const uschar *s = *sptr;
059ec3d9
PH
616uschar *t, *yield;
617
618/* First find the end of the string */
619
620if (*s != '\"')
059ec3d9 621 while (*s != 0 && !isspace(*s)) s++;
059ec3d9
PH
622else
623 {
624 s++;
8c513105 625 while (*s && *s != '\"')
059ec3d9
PH
626 {
627 if (*s == '\\') (void)string_interpret_escape(&s);
628 s++;
629 }
8c513105 630 if (*s) s++;
059ec3d9
PH
631 }
632
633/* Get enough store to copy into */
634
f3ebb786 635t = yield = store_get(s - *sptr + 1, is_tainted(*sptr));
059ec3d9
PH
636s = *sptr;
637
638/* Do the copy */
639
640if (*s != '\"')
059ec3d9 641 while (*s != 0 && !isspace(*s)) *t++ = *s++;
059ec3d9
PH
642else
643 {
644 s++;
645 while (*s != 0 && *s != '\"')
646 {
f3ebb786 647 *t++ = *s == '\\' ? string_interpret_escape(&s) : *s;
059ec3d9
PH
648 s++;
649 }
f3ebb786 650 if (*s) s++;
059ec3d9
PH
651 }
652
653/* Update the pointer and return the terminated copy */
654
655*sptr = s;
656*t = 0;
657return yield;
658}
659#endif /* COMPILE_UTILITY */
660
661
662
663/*************************************************
664* Format a string and save it *
665*************************************************/
666
94759fce 667/* The formatting is done by string_vformat, which checks the length of
13e70f55 668everything. Taint is taken from the worst of the arguments.
059ec3d9
PH
669
670Arguments:
671 format a printf() format - deliberately char * rather than uschar *
672 because it will most usually be a literal string
673 ... arguments for format
674
675Returns: pointer to fresh piece of store containing sprintf'ed string
676*/
677
678uschar *
f3ebb786 679string_sprintf_trc(const char *format, const uschar * func, unsigned line, ...)
059ec3d9 680{
8aa16eb7
JH
681#ifdef COMPILE_UTILITY
682uschar buffer[STRING_SPRINTF_BUFFER_SIZE];
683gstring gs = { .size = STRING_SPRINTF_BUFFER_SIZE, .ptr = 0, .s = buffer };
684gstring * g = &gs;
685unsigned flags = 0;
686#else
687gstring * g = NULL;
688unsigned flags = SVFMT_REBUFFER|SVFMT_EXTEND;
689#endif
d12746bc 690
8aa16eb7 691va_list ap;
f3ebb786 692va_start(ap, line);
8aa16eb7
JH
693g = string_vformat_trc(g, func, line, STRING_SPRINTF_BUFFER_SIZE,
694 flags, format, ap);
059ec3d9 695va_end(ap);
d12746bc 696
f3ebb786 697if (!g)
d12746bc
JH
698 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
699 "string_sprintf expansion was longer than %d; format string was (%s)\n"
f3ebb786
JH
700 " called from %s %d\n",
701 STRING_SPRINTF_BUFFER_SIZE, format, func, line);
d12746bc 702
8aa16eb7
JH
703#ifdef COMPILE_UTILITY
704return string_copyn(g->s, g->ptr);
705#else
f3ebb786
JH
706gstring_release_unused(g);
707return string_from_gstring(g);
8aa16eb7 708#endif
059ec3d9
PH
709}
710
711
712
713/*************************************************
714* Case-independent strncmp() function *
715*************************************************/
716
717/*
718Arguments:
719 s first string
720 t second string
721 n number of characters to compare
722
723Returns: < 0, = 0, or > 0, according to the comparison
724*/
725
726int
1ba28e2b 727strncmpic(const uschar *s, const uschar *t, int n)
059ec3d9
PH
728{
729while (n--)
730 {
731 int c = tolower(*s++) - tolower(*t++);
732 if (c) return c;
733 }
734return 0;
735}
736
737
738/*************************************************
739* Case-independent strcmp() function *
740*************************************************/
741
742/*
743Arguments:
744 s first string
745 t second string
746
747Returns: < 0, = 0, or > 0, according to the comparison
748*/
749
750int
1ba28e2b 751strcmpic(const uschar *s, const uschar *t)
059ec3d9
PH
752{
753while (*s != 0)
754 {
755 int c = tolower(*s++) - tolower(*t++);
756 if (c != 0) return c;
757 }
758return *t;
759}
760
761
762/*************************************************
763* Case-independent strstr() function *
764*************************************************/
765
766/* The third argument specifies whether whitespace is required
767to follow the matched string.
768
769Arguments:
770 s string to search
771 t substring to search for
772 space_follows if TRUE, match only if whitespace follows
773
774Returns: pointer to substring in string, or NULL if not found
775*/
776
777uschar *
778strstric(uschar *s, uschar *t, BOOL space_follows)
779{
780uschar *p = t;
781uschar *yield = NULL;
782int cl = tolower(*p);
783int cu = toupper(*p);
784
785while (*s)
786 {
787 if (*s == cl || *s == cu)
788 {
789 if (yield == NULL) yield = s;
790 if (*(++p) == 0)
791 {
792 if (!space_follows || s[1] == ' ' || s[1] == '\n' ) return yield;
793 yield = NULL;
794 p = t;
795 }
796 cl = tolower(*p);
797 cu = toupper(*p);
798 s++;
799 }
800 else if (yield != NULL)
801 {
802 yield = NULL;
803 p = t;
804 cl = tolower(*p);
805 cu = toupper(*p);
806 }
807 else s++;
808 }
809return NULL;
810}
811
812
813
d12746bc
JH
814#ifdef COMPILE_UTILITY
815/* Dummy version for this function; it should never be called */
816static void
f3ebb786 817gstring_grow(gstring * g, int count)
d12746bc
JH
818{
819assert(FALSE);
820}
821#endif
822
823
824
059ec3d9
PH
825#ifndef COMPILE_UTILITY
826/*************************************************
827* Get next string from separated list *
828*************************************************/
829
830/* Leading and trailing space is removed from each item. The separator in the
831list is controlled by the int pointed to by the separator argument as follows:
832
ec95d1a6
PH
833 If the value is > 0 it is used as the separator. This is typically used for
834 sublists such as slash-separated options. The value is always a printing
835 character.
836
837 (If the value is actually > UCHAR_MAX there is only one item in the list.
059ec3d9
PH
838 This is used for some cases when called via functions that sometimes
839 plough through lists, and sometimes are given single items.)
059ec3d9 840
ec95d1a6
PH
841 If the value is <= 0, the string is inspected for a leading <x, where x is an
842 ispunct() or an iscntrl() character. If found, x is used as the separator. If
843 not found:
844
845 (a) if separator == 0, ':' is used
846 (b) if separator <0, -separator is used
847
848 In all cases the value of the separator that is used is written back to the
849 int so that it is used on subsequent calls as we progress through the list.
850
851A literal ispunct() separator can be represented in an item by doubling, but
852there is no way to include an iscntrl() separator as part of the data.
059ec3d9
PH
853
854Arguments:
855 listptr points to a pointer to the current start of the list; the
856 pointer gets updated to point after the end of the next item
857 separator a pointer to the separator character in an int (see above)
858 buffer where to put a copy of the next string in the list; or
859 NULL if the next string is returned in new memory
860 buflen when buffer is not NULL, the size of buffer; otherwise ignored
861
862Returns: pointer to buffer, containing the next substring,
863 or NULL if no more substrings
864*/
865
866uschar *
55414b25 867string_nextinlist(const uschar **listptr, int *separator, uschar *buffer, int buflen)
059ec3d9 868{
55414b25
JH
869int sep = *separator;
870const uschar *s = *listptr;
ec95d1a6 871BOOL sep_is_special;
059ec3d9 872
8b455685 873if (!s) return NULL;
ec95d1a6
PH
874
875/* This allows for a fixed specified separator to be an iscntrl() character,
876but at the time of implementation, this is never the case. However, it's best
877to be conservative. */
878
879while (isspace(*s) && *s != sep) s++;
880
881/* A change of separator is permitted, so look for a leading '<' followed by an
882allowed character. */
059ec3d9
PH
883
884if (sep <= 0)
885 {
ec95d1a6 886 if (*s == '<' && (ispunct(s[1]) || iscntrl(s[1])))
059ec3d9
PH
887 {
888 sep = s[1];
b72f857f 889 if (*++s) ++s;
ec95d1a6 890 while (isspace(*s) && *s != sep) s++;
059ec3d9
PH
891 }
892 else
8b455685 893 sep = sep ? -sep : ':';
059ec3d9
PH
894 *separator = sep;
895 }
896
ec95d1a6
PH
897/* An empty string has no list elements */
898
8b455685 899if (!*s) return NULL;
059ec3d9 900
ec95d1a6
PH
901/* Note whether whether or not the separator is an iscntrl() character. */
902
903sep_is_special = iscntrl(sep);
904
059ec3d9
PH
905/* Handle the case when a buffer is provided. */
906
617d3932 907if (buffer)
059ec3d9 908 {
d4ff61d1 909 int p = 0;
8b455685 910 for (; *s; s++)
059ec3d9 911 {
ec95d1a6 912 if (*s == sep && (*(++s) != sep || sep_is_special)) break;
059ec3d9
PH
913 if (p < buflen - 1) buffer[p++] = *s;
914 }
915 while (p > 0 && isspace(buffer[p-1])) p--;
8b455685 916 buffer[p] = '\0';
059ec3d9
PH
917 }
918
919/* Handle the case when a buffer is not provided. */
920
921else
922 {
acec9514 923 gstring * g = NULL;
ec95d1a6 924
059ec3d9 925 /* We know that *s != 0 at this point. However, it might be pointing to a
ec95d1a6
PH
926 separator, which could indicate an empty string, or (if an ispunct()
927 character) could be doubled to indicate a separator character as data at the
928 start of a string. Avoid getting working memory for an empty item. */
059ec3d9
PH
929
930 if (*s == sep)
931 {
932 s++;
ec95d1a6
PH
933 if (*s != sep || sep_is_special)
934 {
935 *listptr = s;
936 return string_copy(US"");
937 }
059ec3d9
PH
938 }
939
ec95d1a6
PH
940 /* Not an empty string; the first character is guaranteed to be a data
941 character. */
942
943 for (;;)
059ec3d9 944 {
d7978c0f
JH
945 const uschar * ss;
946 for (ss = s + 1; *ss && *ss != sep; ) ss++;
acec9514 947 g = string_catn(g, s, ss-s);
ec95d1a6 948 s = ss;
8b455685 949 if (!*s || *++s != sep || sep_is_special) break;
059ec3d9 950 }
acec9514
JH
951 while (g->ptr > 0 && isspace(g->s[g->ptr-1])) g->ptr--;
952 buffer = string_from_gstring(g);
e59797e3 953 gstring_release_unused(g);
059ec3d9
PH
954 }
955
956/* Update the current pointer and return the new string */
957
958*listptr = s;
959return buffer;
960}
059ec3d9
PH
961
962
4226691b
JH
963static const uschar *
964Ustrnchr(const uschar * s, int c, unsigned * len)
965{
966unsigned siz = *len;
967while (siz)
968 {
969 if (!*s) return NULL;
970 if (*s == c)
971 {
972 *len = siz;
973 return s;
974 }
975 s++;
976 siz--;
977 }
978return NULL;
979}
980
981
76146973 982/************************************************
1d9ddac9 983* Add element to separated list *
76146973 984************************************************/
4226691b
JH
985/* This function is used to build a list, returning an allocated null-terminated
986growable string. The given element has any embedded separator characters
76146973
JH
987doubled.
988
4226691b
JH
989Despite having the same growable-string interface as string_cat() the list is
990always returned null-terminated.
991
76146973 992Arguments:
acec9514 993 list expanding-string for the list that is being built, or NULL
76146973 994 if this is a new list that has no contents yet
4c04137d
JS
995 sep list separator character
996 ele new element to be appended to the list
76146973
JH
997
998Returns: pointer to the start of the list, changed if copied for expansion.
999*/
1000
acec9514
JH
1001gstring *
1002string_append_listele(gstring * list, uschar sep, const uschar * ele)
76146973 1003{
76146973
JH
1004uschar * sp;
1005
acec9514
JH
1006if (list && list->ptr)
1007 list = string_catn(list, &sep, 1);
76146973 1008
e3dd1d67 1009while((sp = Ustrchr(ele, sep)))
76146973 1010 {
acec9514
JH
1011 list = string_catn(list, ele, sp-ele+1);
1012 list = string_catn(list, &sep, 1);
76146973
JH
1013 ele = sp+1;
1014 }
acec9514
JH
1015list = string_cat(list, ele);
1016(void) string_from_gstring(list);
4226691b 1017return list;
76146973 1018}
00ba27c5
JH
1019
1020
acec9514
JH
1021gstring *
1022string_append_listele_n(gstring * list, uschar sep, const uschar * ele,
1023 unsigned len)
00ba27c5 1024{
00ba27c5
JH
1025const uschar * sp;
1026
acec9514
JH
1027if (list && list->ptr)
1028 list = string_catn(list, &sep, 1);
00ba27c5
JH
1029
1030while((sp = Ustrnchr(ele, sep, &len)))
1031 {
acec9514
JH
1032 list = string_catn(list, ele, sp-ele+1);
1033 list = string_catn(list, &sep, 1);
00ba27c5
JH
1034 ele = sp+1;
1035 len--;
1036 }
acec9514
JH
1037list = string_catn(list, ele, len);
1038(void) string_from_gstring(list);
4226691b 1039return list;
00ba27c5 1040}
76146973
JH
1041
1042
059ec3d9 1043
bce15b62
JH
1044/* A slightly-bogus listmaker utility; the separator is a string so
1045can be multiple chars - there is no checking for the element content
1046containing any of the separator. */
1047
1048gstring *
1049string_append2_listele_n(gstring * list, const uschar * sepstr,
1050 const uschar * ele, unsigned len)
1051{
bce15b62
JH
1052if (list && list->ptr)
1053 list = string_cat(list, sepstr);
1054
1055list = string_catn(list, ele, len);
1056(void) string_from_gstring(list);
1057return list;
1058}
1059
1060
1061
acec9514 1062/************************************************/
f3ebb786
JH
1063/* Add more space to a growable-string. The caller should check
1064first if growth is required. The gstring struct is modified on
1065return; specifically, the string-base-pointer may have been changed.
d12746bc
JH
1066
1067Arguments:
1068 g the growable-string
f3ebb786 1069 count amount needed for g->ptr to increase by
938593e9
JH
1070*/
1071
1072static void
f3ebb786 1073gstring_grow(gstring * g, int count)
acec9514 1074{
f3ebb786 1075int p = g->ptr;
acec9514 1076int oldsize = g->size;
f3ebb786 1077BOOL tainted = is_tainted(g->s);
acec9514
JH
1078
1079/* Mostly, string_cat() is used to build small strings of a few hundred
1080characters at most. There are times, however, when the strings are very much
1081longer (for example, a lookup that returns a vast number of alias addresses).
1082To try to keep things reasonable, we use increments whose size depends on the
1083existing length of the string. */
1084
1085unsigned inc = oldsize < 4096 ? 127 : 1023;
f3ebb786
JH
1086
1087if (count <= 0) return;
1088g->size = (p + count + inc + 1) & ~inc; /* one for a NUL */
acec9514
JH
1089
1090/* Try to extend an existing allocation. If the result of calling
1091store_extend() is false, either there isn't room in the current memory block,
1092or this string is not the top item on the dynamic store stack. We then have
1093to get a new chunk of store and copy the old string. When building large
1094strings, it is helpful to call store_release() on the old string, to release
1095memory blocks that have become empty. (The block will be freed if the string
1096is at its start.) However, we can do this only if we know that the old string
1097was the last item on the dynamic memory stack. This is the case if it matches
1098store_last_get. */
1099
f3ebb786
JH
1100if (!store_extend(g->s, tainted, oldsize, g->size))
1101 g->s = store_newblock(g->s, tainted, g->size, p);
acec9514
JH
1102}
1103
1104
1105
d12746bc
JH
1106/*************************************************
1107* Add chars to string *
1108*************************************************/
059ec3d9
PH
1109/* This function is used when building up strings of unknown length. Room is
1110always left for a terminating zero to be added to the string that is being
1111built. This function does not require the string that is being added to be NUL
1112terminated, because the number of characters to add is given explicitly. It is
1113sometimes called to extract parts of other strings.
1114
1115Arguments:
1116 string points to the start of the string that is being built, or NULL
1117 if this is a new string that has no contents yet
059ec3d9
PH
1118 s points to characters to add
1119 count count of characters to add; must not exceed the length of s, if s
42055a33 1120 is a C string.
059ec3d9 1121
059ec3d9
PH
1122Returns: pointer to the start of the string, changed if copied for expansion.
1123 Note that a NUL is not added, though space is left for one. This is
1124 because string_cat() is often called multiple times to build up a
1125 string - there's no point adding the NUL till the end.
a1b8a755 1126
059ec3d9 1127*/
96f5fe4c 1128/* coverity[+alloc] */
059ec3d9 1129
acec9514
JH
1130gstring *
1131string_catn(gstring * g, const uschar *s, int count)
059ec3d9 1132{
acec9514 1133int p;
f3ebb786 1134BOOL srctaint = is_tainted(s);
059ec3d9 1135
acec9514 1136if (!g)
059ec3d9 1137 {
acec9514
JH
1138 unsigned inc = count < 4096 ? 127 : 1023;
1139 unsigned size = ((count + inc) & ~inc) + 1;
f3ebb786 1140 g = string_get_tainted(size, srctaint);
059ec3d9 1141 }
f3ebb786
JH
1142else if (srctaint && !is_tainted(g->s))
1143 gstring_rebuffer(g);
059ec3d9 1144
acec9514
JH
1145p = g->ptr;
1146if (p + count >= g->size)
f3ebb786 1147 gstring_grow(g, count);
acec9514 1148
059ec3d9
PH
1149/* Because we always specify the exact number of characters to copy, we can
1150use memcpy(), which is likely to be more efficient than strncopy() because the
acec9514 1151latter has to check for zero bytes. */
059ec3d9 1152
acec9514
JH
1153memcpy(g->s + p, s, count);
1154g->ptr = p + count;
1155return g;
059ec3d9 1156}
c3aefacc
HSHR
1157
1158
acec9514
JH
1159gstring *
1160string_cat(gstring *string, const uschar *s)
c2f669a4 1161{
acec9514 1162return string_catn(string, s, Ustrlen(s));
c2f669a4 1163}
059ec3d9
PH
1164
1165
1166
059ec3d9
PH
1167/*************************************************
1168* Append strings to another string *
1169*************************************************/
1170
1171/* This function can be used to build a string from many other strings.
1172It calls string_cat() to do the dirty work.
1173
1174Arguments:
acec9514 1175 string expanding-string that is being built, or NULL
059ec3d9 1176 if this is a new string that has no contents yet
059ec3d9
PH
1177 count the number of strings to append
1178 ... "count" uschar* arguments, which must be valid zero-terminated
1179 C strings
1180
1181Returns: pointer to the start of the string, changed if copied for expansion.
1182 The string is not zero-terminated - see string_cat() above.
1183*/
1184
acec9514
JH
1185__inline__ gstring *
1186string_append(gstring *string, int count, ...)
059ec3d9
PH
1187{
1188va_list ap;
059ec3d9
PH
1189
1190va_start(ap, count);
acec9514 1191while (count-- > 0)
059ec3d9
PH
1192 {
1193 uschar *t = va_arg(ap, uschar *);
acec9514 1194 string = string_cat(string, t);
059ec3d9
PH
1195 }
1196va_end(ap);
1197
1198return string;
1199}
1200#endif
1201
1202
1203
1204/*************************************************
1205* Format a string with length checks *
1206*************************************************/
1207
1208/* This function is used to format a string with checking of the length of the
1209output for all conversions. It protects Exim from absent-mindedness when
1210calling functions like debug_printf and string_sprintf, and elsewhere. There
1211are two different entry points to what is actually the same function, depending
1212on whether the variable length list of data arguments are given explicitly or
1213as a va_list item.
1214
1215The formats are the usual printf() ones, with some omissions (never used) and
c0b9d3e8 1216three additions for strings: %S forces lower case, %T forces upper case, and
acec9514 1217%#s or %#S prints nothing for a NULL string. Without the # "NULL" is printed
c0b9d3e8
JH
1218(useful in debugging). There is also the addition of %D and %M, which insert
1219the date in the form used for datestamped log files.
059ec3d9
PH
1220
1221Arguments:
1222 buffer a buffer in which to put the formatted string
1223 buflen the length of the buffer
1224 format the format string - deliberately char * and not uschar *
1225 ... or ap variable list of supplementary arguments
1226
1227Returns: TRUE if the result fitted in the buffer
1228*/
1229
1230BOOL
f3ebb786
JH
1231string_format_trc(uschar * buffer, int buflen,
1232 const uschar * func, unsigned line, const char * format, ...)
059ec3d9 1233{
d12746bc 1234gstring g = { .size = buflen, .ptr = 0, .s = buffer }, *gp;
059ec3d9
PH
1235va_list ap;
1236va_start(ap, format);
f3ebb786
JH
1237gp = string_vformat_trc(&g, func, line, STRING_SPRINTF_BUFFER_SIZE,
1238 0, format, ap);
059ec3d9 1239va_end(ap);
d12746bc
JH
1240g.s[g.ptr] = '\0';
1241return !!gp;
059ec3d9
PH
1242}
1243
1244
d12746bc 1245
f3ebb786
JH
1246/* Copy the content of a string to tainted memory */
1247static void
1248gstring_rebuffer(gstring * g)
1249{
1250uschar * s = store_get(g->size, TRUE);
1251memcpy(s, g->s, g->ptr);
1252g->s = s;
1253}
1254
d12746bc
JH
1255
1256
f3ebb786 1257/* Build or append to a growing-string, sprintf-style.
d12746bc 1258
b273058b
JH
1259Arguments:
1260 g a growable-string
1261 func called-from function name, for debug
1262 line called-from file line number, for debug
1263 limit maximum string size
1264 flags see below
1265 format printf-like format string
1266 ap variable-args pointer
1267
1268Flags:
1269 SVFMT_EXTEND buffer can be created or exteded as needed
1270 SVFMT_REBUFFER buffer can be recopied to tainted mem as needed
1271 SVFMT_TAINT_NOCHK do not check inputs for taint
1272
f3ebb786
JH
1273If the "extend" flag is true, the string passed in can be NULL,
1274empty, or non-empty. Growing is subject to an overall limit given
b273058b 1275by the limit argument.
d12746bc 1276
f3ebb786 1277If the "extend" flag is false, the string passed in may not be NULL,
d12746bc
JH
1278will not be grown, and is usable in the original place after return.
1279The return value can be NULL to signify overflow.
1280
adc4ecf9
JH
1281Returns the possibly-new (if copy for growth or taint-handling was needed)
1282string, not nul-terminated.
d12746bc
JH
1283*/
1284
1285gstring *
f3ebb786
JH
1286string_vformat_trc(gstring * g, const uschar * func, unsigned line,
1287 unsigned size_limit, unsigned flags, const char *format, va_list ap)
059ec3d9 1288{
d12746bc
JH
1289enum ltypes { L_NORMAL=1, L_SHORT=2, L_LONG=3, L_LONGLONG=4, L_LONGDOUBLE=5, L_SIZE=6 };
1290
f3ebb786 1291int width, precision, off, lim, need;
d12746bc 1292const char * fp = format; /* Deliberately not unsigned */
f3ebb786 1293BOOL dest_tainted = FALSE;
b1c749bb 1294
d12746bc
JH
1295string_datestamp_offset = -1; /* Datestamp not inserted */
1296string_datestamp_length = 0; /* Datestamp not inserted */
1297string_datestamp_type = 0; /* Datestamp not inserted */
059ec3d9 1298
d12746bc 1299#ifdef COMPILE_UTILITY
f3ebb786 1300assert(!(flags & SVFMT_EXTEND));
d12746bc
JH
1301assert(g);
1302#else
1303
1304/* Ensure we have a string, to save on checking later */
1305if (!g) g = string_get(16);
f3ebb786
JH
1306else if (!(flags & SVFMT_TAINT_NOCHK)) dest_tainted = is_tainted(g->s);
1307
1308if (!(flags & SVFMT_TAINT_NOCHK) && !dest_tainted && is_tainted(format))
1309 {
aaabfafe 1310#ifndef MACRO_PREDEF
f3ebb786
JH
1311 if (!(flags & SVFMT_REBUFFER))
1312 die_tainted(US"string_vformat", func, line);
aaabfafe 1313#endif
f3ebb786
JH
1314 gstring_rebuffer(g);
1315 dest_tainted = TRUE;
1316 }
d12746bc
JH
1317#endif /*!COMPILE_UTILITY*/
1318
1319lim = g->size - 1; /* leave one for a nul */
1320off = g->ptr; /* remember initial offset in gstring */
059ec3d9
PH
1321
1322/* Scan the format and handle the insertions */
1323
d12746bc 1324while (*fp)
059ec3d9 1325 {
b1c749bb 1326 int length = L_NORMAL;
059ec3d9
PH
1327 int *nptr;
1328 int slen;
d12746bc
JH
1329 const char *null = "NULL"; /* ) These variables */
1330 const char *item_start, *s; /* ) are deliberately */
1331 char newformat[16]; /* ) not unsigned */
1332 char * gp = CS g->s + g->ptr; /* ) */
059ec3d9
PH
1333
1334 /* Non-% characters just get copied verbatim */
1335
1336 if (*fp != '%')
1337 {
d12746bc 1338 /* Avoid string_copyn() due to COMPILE_UTILITY */
f3ebb786 1339 if ((need = g->ptr + 1) > lim)
1100a343 1340 {
f3ebb786
JH
1341 if (!(flags & SVFMT_EXTEND) || need > size_limit) return NULL;
1342 gstring_grow(g, 1);
1100a343
JH
1343 lim = g->size - 1;
1344 }
d12746bc 1345 g->s[g->ptr++] = (uschar) *fp++;
059ec3d9
PH
1346 continue;
1347 }
1348
1349 /* Deal with % characters. Pick off the width and precision, for checking
1350 strings, skipping over the flag and modifier characters. */
1351
1352 item_start = fp;
1353 width = precision = -1;
1354
1355 if (strchr("-+ #0", *(++fp)) != NULL)
1356 {
1357 if (*fp == '#') null = "";
1358 fp++;
1359 }
1360
1361 if (isdigit((uschar)*fp))
1362 {
1363 width = *fp++ - '0';
1364 while (isdigit((uschar)*fp)) width = width * 10 + *fp++ - '0';
1365 }
1366 else if (*fp == '*')
1367 {
1368 width = va_arg(ap, int);
1369 fp++;
1370 }
1371
1372 if (*fp == '.')
059ec3d9
PH
1373 if (*(++fp) == '*')
1374 {
1375 precision = va_arg(ap, int);
1376 fp++;
1377 }
1378 else
d12746bc
JH
1379 for (precision = 0; isdigit((uschar)*fp); fp++)
1380 precision = precision*10 + *fp - '0';
059ec3d9 1381
91a246f6 1382 /* Skip over 'h', 'L', 'l', 'll' and 'z', remembering the item length */
b1c749bb
PH
1383
1384 if (*fp == 'h')
1385 { fp++; length = L_SHORT; }
1386 else if (*fp == 'L')
1387 { fp++; length = L_LONGDOUBLE; }
1388 else if (*fp == 'l')
b1c749bb 1389 if (fp[1] == 'l')
d12746bc 1390 { fp += 2; length = L_LONGLONG; }
b1c749bb 1391 else
d12746bc 1392 { fp++; length = L_LONG; }
91a246f6
PP
1393 else if (*fp == 'z')
1394 { fp++; length = L_SIZE; }
059ec3d9
PH
1395
1396 /* Handle each specific format type. */
1397
1398 switch (*fp++)
1399 {
1400 case 'n':
d12746bc
JH
1401 nptr = va_arg(ap, int *);
1402 *nptr = g->ptr - off;
1403 break;
059ec3d9
PH
1404
1405 case 'd':
1406 case 'o':
1407 case 'u':
1408 case 'x':
1409 case 'X':
d12746bc 1410 width = length > L_LONG ? 24 : 12;
f3ebb786 1411 if ((need = g->ptr + width) > lim)
1100a343 1412 {
f3ebb786
JH
1413 if (!(flags & SVFMT_EXTEND) || need >= size_limit) return NULL;
1414 gstring_grow(g, width);
1100a343
JH
1415 lim = g->size - 1;
1416 gp = CS g->s + g->ptr;
1417 }
d12746bc
JH
1418 strncpy(newformat, item_start, fp - item_start);
1419 newformat[fp - item_start] = 0;
b1c749bb 1420
d12746bc
JH
1421 /* Short int is promoted to int when passing through ..., so we must use
1422 int for va_arg(). */
b1c749bb 1423
d12746bc
JH
1424 switch(length)
1425 {
1426 case L_SHORT:
1427 case L_NORMAL:
1428 g->ptr += sprintf(gp, newformat, va_arg(ap, int)); break;
1429 case L_LONG:
1430 g->ptr += sprintf(gp, newformat, va_arg(ap, long int)); break;
1431 case L_LONGLONG:
1432 g->ptr += sprintf(gp, newformat, va_arg(ap, LONGLONG_T)); break;
1433 case L_SIZE:
1434 g->ptr += sprintf(gp, newformat, va_arg(ap, size_t)); break;
1435 }
1436 break;
059ec3d9
PH
1437
1438 case 'p':
2e8db779
JH
1439 {
1440 void * ptr;
f3ebb786 1441 if ((need = g->ptr + 24) > lim)
1100a343 1442 {
f3ebb786
JH
1443 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1444 gstring_grow(g, 24);
1100a343
JH
1445 lim = g->size - 1;
1446 gp = CS g->s + g->ptr;
1447 }
81f358da
JH
1448 /* sprintf() saying "(nil)" for a null pointer seems unreliable.
1449 Handle it explicitly. */
2e8db779
JH
1450 if ((ptr = va_arg(ap, void *)))
1451 {
1452 strncpy(newformat, item_start, fp - item_start);
1453 newformat[fp - item_start] = 0;
d12746bc 1454 g->ptr += sprintf(gp, newformat, ptr);
2e8db779
JH
1455 }
1456 else
d12746bc 1457 g->ptr += sprintf(gp, "(nil)");
2e8db779 1458 }
059ec3d9
PH
1459 break;
1460
1461 /* %f format is inherently insecure if the numbers that it may be
870f6ba8
TF
1462 handed are unknown (e.g. 1e300). However, in Exim, %f is used for
1463 printing load averages, and these are actually stored as integers
1464 (load average * 1000) so the size of the numbers is constrained.
1465 It is also used for formatting sending rates, where the simplicity
1466 of the format prevents overflow. */
059ec3d9
PH
1467
1468 case 'f':
1469 case 'e':
1470 case 'E':
1471 case 'g':
1472 case 'G':
d12746bc 1473 if (precision < 0) precision = 6;
f3ebb786 1474 if ((need = g->ptr + precision + 8) > lim)
1100a343 1475 {
f3ebb786
JH
1476 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1477 gstring_grow(g, precision+8);
1100a343
JH
1478 lim = g->size - 1;
1479 gp = CS g->s + g->ptr;
1480 }
d12746bc
JH
1481 strncpy(newformat, item_start, fp - item_start);
1482 newformat[fp-item_start] = 0;
1483 if (length == L_LONGDOUBLE)
1484 g->ptr += sprintf(gp, newformat, va_arg(ap, long double));
1485 else
1486 g->ptr += sprintf(gp, newformat, va_arg(ap, double));
1487 break;
059ec3d9
PH
1488
1489 /* String types */
1490
1491 case '%':
f3ebb786 1492 if ((need = g->ptr + 1) > lim)
1100a343 1493 {
f3ebb786
JH
1494 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1495 gstring_grow(g, 1);
1100a343
JH
1496 lim = g->size - 1;
1497 }
d12746bc
JH
1498 g->s[g->ptr++] = (uschar) '%';
1499 break;
059ec3d9
PH
1500
1501 case 'c':
f3ebb786 1502 if ((need = g->ptr + 1) > lim)
1100a343 1503 {
f3ebb786
JH
1504 if (!(flags & SVFMT_EXTEND || need >= size_limit)) return NULL;
1505 gstring_grow(g, 1);
1100a343
JH
1506 lim = g->size - 1;
1507 }
d12746bc
JH
1508 g->s[g->ptr++] = (uschar) va_arg(ap, int);
1509 break;
059ec3d9 1510
f1e5fef5 1511 case 'D': /* Insert daily datestamp for log file names */
d12746bc
JH
1512 s = CS tod_stamp(tod_log_datestamp_daily);
1513 string_datestamp_offset = g->ptr; /* Passed back via global */
1514 string_datestamp_length = Ustrlen(s); /* Passed back via global */
1515 string_datestamp_type = tod_log_datestamp_daily;
1516 slen = string_datestamp_length;
1517 goto INSERT_STRING;
f1e5fef5
PP
1518
1519 case 'M': /* Insert monthly datestamp for log file names */
d12746bc
JH
1520 s = CS tod_stamp(tod_log_datestamp_monthly);
1521 string_datestamp_offset = g->ptr; /* Passed back via global */
1522 string_datestamp_length = Ustrlen(s); /* Passed back via global */
1523 string_datestamp_type = tod_log_datestamp_monthly;
1524 slen = string_datestamp_length;
1525 goto INSERT_STRING;
059ec3d9
PH
1526
1527 case 's':
1528 case 'S': /* Forces *lower* case */
c0b9d3e8 1529 case 'T': /* Forces *upper* case */
d12746bc 1530 s = va_arg(ap, char *);
059ec3d9 1531
d12746bc
JH
1532 if (!s) s = null;
1533 slen = Ustrlen(s);
059ec3d9 1534
f3ebb786
JH
1535 if (!(flags & SVFMT_TAINT_NOCHK) && !dest_tainted && is_tainted(s))
1536 if (flags & SVFMT_REBUFFER)
1537 {
1538 gstring_rebuffer(g);
1539 gp = CS g->s + g->ptr;
1540 dest_tainted = TRUE;
1541 }
aaabfafe 1542#ifndef MACRO_PREDEF
f3ebb786
JH
1543 else
1544 die_tainted(US"string_vformat", func, line);
aaabfafe 1545#endif
f3ebb786 1546
f1e5fef5
PP
1547 INSERT_STRING: /* Come to from %D or %M above */
1548
059ec3d9 1549 {
d12746bc 1550 BOOL truncated = FALSE;
059ec3d9 1551
d12746bc
JH
1552 /* If the width is specified, check that there is a precision
1553 set; if not, set it to the width to prevent overruns of long
1554 strings. */
059ec3d9 1555
d12746bc
JH
1556 if (width >= 0)
1557 {
1558 if (precision < 0) precision = width;
1559 }
059ec3d9 1560
d12746bc
JH
1561 /* If a width is not specified and the precision is specified, set
1562 the width to the precision, or the string length if shorted. */
059ec3d9 1563
d12746bc
JH
1564 else if (precision >= 0)
1565 width = precision < slen ? precision : slen;
059ec3d9 1566
d12746bc 1567 /* If neither are specified, set them both to the string length. */
059ec3d9 1568
d12746bc
JH
1569 else
1570 width = precision = slen;
1571
f3ebb786 1572 if ((need = g->ptr + width) >= size_limit || !(flags & SVFMT_EXTEND))
d12746bc
JH
1573 {
1574 if (g->ptr == lim) return NULL;
f3ebb786 1575 if (need > lim)
d12746bc
JH
1576 {
1577 truncated = TRUE;
1578 width = precision = lim - g->ptr - 1;
1579 if (width < 0) width = 0;
1580 if (precision < 0) precision = 0;
1581 }
1582 }
f3ebb786 1583 else if (need > lim)
1100a343 1584 {
f3ebb786 1585 gstring_grow(g, width);
1100a343
JH
1586 lim = g->size - 1;
1587 gp = CS g->s + g->ptr;
1588 }
d12746bc
JH
1589
1590 g->ptr += sprintf(gp, "%*.*s", width, precision, s);
1591 if (fp[-1] == 'S')
1592 while (*gp) { *gp = tolower(*gp); gp++; }
1593 else if (fp[-1] == 'T')
1594 while (*gp) { *gp = toupper(*gp); gp++; }
1595
1596 if (truncated) return NULL;
1597 break;
059ec3d9 1598 }
059ec3d9
PH
1599
1600 /* Some things are never used in Exim; also catches junk. */
1601
1602 default:
d12746bc
JH
1603 strncpy(newformat, item_start, fp - item_start);
1604 newformat[fp-item_start] = 0;
1605 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "string_format: unsupported type "
1606 "in \"%s\" in \"%s\"", newformat, format);
1607 break;
059ec3d9
PH
1608 }
1609 }
1610
f3ebb786
JH
1611if (g->ptr > g->size)
1612 log_write(0, LOG_MAIN|LOG_PANIC_DIE,
1613 "string_format internal error: caller %s %d", func, line);
d12746bc
JH
1614return g;
1615}
059ec3d9 1616
059ec3d9 1617
d12746bc
JH
1618
1619#ifndef COMPILE_UTILITY
059ec3d9
PH
1620/*************************************************
1621* Generate an "open failed" message *
1622*************************************************/
1623
1624/* This function creates a message after failure to open a file. It includes a
1625string supplied as data, adds the strerror() text, and if the failure was
1626"Permission denied", reads and includes the euid and egid.
1627
1628Arguments:
1629 eno the value of errno after the failure
1630 format a text format string - deliberately not uschar *
1631 ... arguments for the format string
1632
1633Returns: a message, in dynamic store
1634*/
1635
1636uschar *
f3ebb786
JH
1637string_open_failed_trc(int eno, const uschar * func, unsigned line,
1638 const char *format, ...)
059ec3d9
PH
1639{
1640va_list ap;
d12746bc 1641gstring * g = string_get(1024);
059ec3d9 1642
d12746bc 1643g = string_catn(g, US"failed to open ", 15);
059ec3d9
PH
1644
1645/* Use the checked formatting routine to ensure that the buffer
1646does not overflow. It should not, since this is called only for internally
1647specified messages. If it does, the message just gets truncated, and there
1648doesn't seem much we can do about that. */
1649
d12746bc 1650va_start(ap, format);
f3ebb786
JH
1651(void) string_vformat_trc(g, func, line, STRING_SPRINTF_BUFFER_SIZE,
1652 0, format, ap);
d12746bc 1653string_from_gstring(g);
e59797e3 1654gstring_release_unused(g);
cb570b5e 1655va_end(ap);
059ec3d9 1656
d12746bc
JH
1657return eno == EACCES
1658 ? string_sprintf("%s: %s (euid=%ld egid=%ld)", g->s, strerror(eno),
1659 (long int)geteuid(), (long int)getegid())
1660 : string_sprintf("%s: %s", g->s, strerror(eno));
059ec3d9
PH
1661}
1662#endif /* COMPILE_UTILITY */
1663
1664
1665
059ec3d9
PH
1666
1667
bc3c7bb7
HSHR
1668#ifndef COMPILE_UTILITY
1669/* qsort(3), currently used to sort the environment variables
1670for -bP environment output, needs a function to compare two pointers to string
1671pointers. Here it is. */
1672
1673int
84bbb4d8 1674string_compare_by_pointer(const void *a, const void *b)
bc3c7bb7 1675{
35a5627d 1676return Ustrcmp(* CUSS a, * CUSS b);
bc3c7bb7
HSHR
1677}
1678#endif /* COMPILE_UTILITY */
059ec3d9
PH
1679
1680
1681
d12746bc 1682
059ec3d9
PH
1683/*************************************************
1684**************************************************
1685* Stand-alone test program *
1686**************************************************
1687*************************************************/
1688
1689#ifdef STAND_ALONE
1690int main(void)
1691{
1692uschar buffer[256];
1693
1694printf("Testing is_ip_address\n");
1695
1696while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1697 {
1698 int offset;
1699 buffer[Ustrlen(buffer) - 1] = 0;
1700 printf("%d\n", string_is_ip_address(buffer, NULL));
1701 printf("%d %d %s\n", string_is_ip_address(buffer, &offset), offset, buffer);
1702 }
1703
1704printf("Testing string_nextinlist\n");
1705
1706while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1707 {
1708 uschar *list = buffer;
1709 uschar *lp1, *lp2;
1710 uschar item[256];
1711 int sep1 = 0;
1712 int sep2 = 0;
1713
1714 if (*list == '<')
1715 {
1716 sep1 = sep2 = list[1];
1717 list += 2;
1718 }
1719
1720 lp1 = lp2 = list;
1721 for (;;)
1722 {
1723 uschar *item1 = string_nextinlist(&lp1, &sep1, item, sizeof(item));
1724 uschar *item2 = string_nextinlist(&lp2, &sep2, NULL, 0);
1725
1726 if (item1 == NULL && item2 == NULL) break;
1727 if (item == NULL || item2 == NULL || Ustrcmp(item1, item2) != 0)
1728 {
1729 printf("***ERROR\nitem1=\"%s\"\nitem2=\"%s\"\n",
1730 (item1 == NULL)? "NULL" : CS item1,
1731 (item2 == NULL)? "NULL" : CS item2);
1732 break;
1733 }
1734 else printf(" \"%s\"\n", CS item1);
1735 }
1736 }
1737
1738/* This is a horrible lash-up, but it serves its purpose. */
1739
1740printf("Testing string_format\n");
1741
1742while (fgets(CS buffer, sizeof(buffer), stdin) != NULL)
1743 {
1744 void *args[3];
ed72ace5 1745 long long llargs[3];
059ec3d9
PH
1746 double dargs[3];
1747 int dflag = 0;
ed72ace5 1748 int llflag = 0;
059ec3d9
PH
1749 int n = 0;
1750 int count;
1751 int countset = 0;
1752 uschar format[256];
1753 uschar outbuf[256];
1754 uschar *s;
1755 buffer[Ustrlen(buffer) - 1] = 0;
1756
1757 s = Ustrchr(buffer, ',');
1758 if (s == NULL) s = buffer + Ustrlen(buffer);
1759
1760 Ustrncpy(format, buffer, s - buffer);
1761 format[s-buffer] = 0;
1762
1763 if (*s == ',') s++;
1764
1765 while (*s != 0)
1766 {
1767 uschar *ss = s;
1768 s = Ustrchr(ss, ',');
1769 if (s == NULL) s = ss + Ustrlen(ss);
1770
1771 if (isdigit(*ss))
1772 {
1773 Ustrncpy(outbuf, ss, s-ss);
1774 if (Ustrchr(outbuf, '.') != NULL)
1775 {
1776 dflag = 1;
1777 dargs[n++] = Ustrtod(outbuf, NULL);
1778 }
ed72ace5
PH
1779 else if (Ustrstr(outbuf, "ll") != NULL)
1780 {
1781 llflag = 1;
1782 llargs[n++] = strtoull(CS outbuf, NULL, 10);
1783 }
059ec3d9
PH
1784 else
1785 {
1786 args[n++] = (void *)Uatoi(outbuf);
1787 }
1788 }
1789
1790 else if (Ustrcmp(ss, "*") == 0)
1791 {
1792 args[n++] = (void *)(&count);
1793 countset = 1;
1794 }
1795
1796 else
1797 {
1798 uschar *sss = malloc(s - ss + 1);
1799 Ustrncpy(sss, ss, s-ss);
1800 args[n++] = sss;
1801 }
1802
1803 if (*s == ',') s++;
1804 }
1805
ed72ace5
PH
1806 if (!dflag && !llflag)
1807 printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
1808 args[0], args[1], args[2])? "True" : "False");
1809
1810 else if (dflag)
1811 printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
1812 dargs[0], dargs[1], dargs[2])? "True" : "False");
059ec3d9
PH
1813
1814 else printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format,
ed72ace5 1815 llargs[0], llargs[1], llargs[2])? "True" : "False");
059ec3d9
PH
1816
1817 printf("%s\n", CS outbuf);
1818 if (countset) printf("count=%d\n", count);
1819 }
1820
1821return 0;
1822}
1823#endif
1824
1825/* End of string.c */