/************************************************* * Exim - an Internet mail transport agent * *************************************************/ /* Copyright (c) University of Cambridge 1995 - 2014 */ /* See the file NOTICE for conditions of use and distribution. */ /* Miscellaneous string-handling functions. Some are not required for utilities and tests, and are cut out by the COMPILE_UTILITY macro. */ #include "exim.h" #ifndef COMPILE_UTILITY /************************************************* * Test for IP address * *************************************************/ /* This used just to be a regular expression, but with IPv6 things are a bit more complicated. If the address contains a colon, it is assumed to be a v6 address (assuming HAVE_IPV6 is set). If a mask is permitted and one is present, and maskptr is not NULL, its offset is placed there. Arguments: s a string maskptr NULL if no mask is permitted to follow otherwise, points to an int where the offset of '/' is placed if there is no / followed by trailing digits, *maskptr is set 0 Returns: 0 if the string is not a textual representation of an IP address 4 if it is an IPv4 address 6 if it is an IPv6 address */ int string_is_ip_address(const uschar *s, int *maskptr) { int i; int yield = 4; /* If an optional mask is permitted, check for it. If found, pass back the offset. */ if (maskptr != NULL) { const uschar *ss = s + Ustrlen(s); *maskptr = 0; if (s != ss && isdigit(*(--ss))) { while (ss > s && isdigit(ss[-1])) ss--; if (ss > s && *(--ss) == '/') *maskptr = ss - s; } } /* A colon anywhere in the string => IPv6 address */ if (Ustrchr(s, ':') != NULL) { BOOL had_double_colon = FALSE; BOOL v4end = FALSE; int count = 0; yield = 6; /* An IPv6 address must start with hex digit or double colon. A single colon is invalid. */ if (*s == ':' && *(++s) != ':') return 0; /* Now read up to 8 components consisting of up to 4 hex digits each. There may be one and only one appearance of double colon, which implies any number of binary zero bits. The number of preceding components is held in count. */ for (count = 0; count < 8; count++) { /* If the end of the string is reached before reading 8 components, the address is valid provided a double colon has been read. This also applies if we hit the / that introduces a mask or the % that introduces the interface specifier (scope id) of a link-local address. */ if (*s == 0 || *s == '%' || *s == '/') return had_double_colon? yield : 0; /* If a component starts with an additional colon, we have hit a double colon. This is permitted to appear once only, and counts as at least one component. The final component may be of this form. */ if (*s == ':') { if (had_double_colon) return 0; had_double_colon = TRUE; s++; continue; } /* If the remainder of the string contains a dot but no colons, we can expect a trailing IPv4 address. This is valid if either there has been no double-colon and this is the 7th component (with the IPv4 address being the 7th & 8th components), OR if there has been a double-colon and fewer than 6 components. */ if (Ustrchr(s, ':') == NULL && Ustrchr(s, '.') != NULL) { if ((!had_double_colon && count != 6) || (had_double_colon && count > 6)) return 0; v4end = TRUE; yield = 6; break; } /* Check for at least one and not more than 4 hex digits for this component. */ if (!isxdigit(*s++)) return 0; if (isxdigit(*s) && isxdigit(*(++s)) && isxdigit(*(++s))) s++; /* If the component is terminated by colon and there is more to follow, skip over the colon. If there is no more to follow the address is invalid. */ if (*s == ':' && *(++s) == 0) return 0; } /* If about to handle a trailing IPv4 address, drop through. Otherwise all is well if we are at the end of the string or at the mask or at a percent sign, which introduces the interface specifier (scope id) of a link local address. */ if (!v4end) return (*s == 0 || *s == '%' || (*s == '/' && maskptr != NULL && *maskptr != 0))? yield : 0; } /* Test for IPv4 address, which may be the tail-end of an IPv6 address. */ for (i = 0; i < 4; i++) { if (i != 0 && *s++ != '.') return 0; if (!isdigit(*s++)) return 0; if (isdigit(*s) && isdigit(*(++s))) s++; } return (*s == 0 || (*s == '/' && maskptr != NULL && *maskptr != 0))? yield : 0; } #endif /* COMPILE_UTILITY */ /************************************************* * Format message size * *************************************************/ /* Convert a message size in bytes to printing form, rounding according to the magnitude of the number. A value of zero causes a string of spaces to be returned. Arguments: size the message size in bytes buffer where to put the answer Returns: pointer to the buffer a string of exactly 5 characters is normally returned */ uschar * string_format_size(int size, uschar *buffer) { if (size == 0) Ustrcpy(buffer, " "); else if (size < 1024) sprintf(CS buffer, "%5d", size); else if (size < 10*1024) sprintf(CS buffer, "%4.1fK", (double)size / 1024.0); else if (size < 1024*1024) sprintf(CS buffer, "%4dK", (size + 512)/1024); else if (size < 10*1024*1024) sprintf(CS buffer, "%4.1fM", (double)size / (1024.0 * 1024.0)); else sprintf(CS buffer, "%4dM", (size + 512 * 1024)/(1024*1024)); return buffer; } #ifndef COMPILE_UTILITY /************************************************* * Convert a number to base 62 format * *************************************************/ /* Convert a long integer into an ASCII base 62 string. For Cygwin the value of BASE_62 is actually 36. Always return exactly 6 characters plus zero, in a static area. Argument: a long integer Returns: pointer to base 62 string */ uschar * string_base62(unsigned long int value) { static uschar yield[7]; uschar *p = yield + sizeof(yield) - 1; *p = 0; while (p > yield) { *(--p) = base62_chars[value % BASE_62]; value /= BASE_62; } return yield; } #endif /* COMPILE_UTILITY */ /************************************************* * Interpret escape sequence * *************************************************/ /* This function is called from several places where escape sequences are to be interpreted in strings. Arguments: pp points a pointer to the initiating "\" in the string; the pointer gets updated to point to the final character Returns: the value of the character escape */ int string_interpret_escape(const uschar **pp) { #ifdef COMPILE_UTILITY const uschar *hex_digits= CUS"0123456789abcdef"; #endif int ch; const uschar *p = *pp; ch = *(++p); if (isdigit(ch) && ch != '8' && ch != '9') { ch -= '0'; if (isdigit(p[1]) && p[1] != '8' && p[1] != '9') { ch = ch * 8 + *(++p) - '0'; if (isdigit(p[1]) && p[1] != '8' && p[1] != '9') ch = ch * 8 + *(++p) - '0'; } } else switch(ch) { case 'b': ch = '\b'; break; case 'f': ch = '\f'; break; case 'n': ch = '\n'; break; case 'r': ch = '\r'; break; case 't': ch = '\t'; break; case 'v': ch = '\v'; break; case 'x': ch = 0; if (isxdigit(p[1])) { ch = ch * 16 + Ustrchr(hex_digits, tolower(*(++p))) - hex_digits; if (isxdigit(p[1])) ch = ch * 16 + Ustrchr(hex_digits, tolower(*(++p))) - hex_digits; } break; } *pp = p; return ch; } #ifndef COMPILE_UTILITY /************************************************* * Ensure string is printable * *************************************************/ /* This function is called for critical strings. It checks for any non-printing characters, and if any are found, it makes a new copy of the string with suitable escape sequences. It is most often called by the macro string_printing(), which sets allow_tab TRUE. Arguments: s the input string allow_tab TRUE to allow tab as a printing character Returns: string with non-printers encoded as printing sequences */ const uschar * string_printing2(const uschar *s, BOOL allow_tab) { int nonprintcount = 0; int length = 0; const uschar *t = s; uschar *ss, *tt; while (*t != 0) { int c = *t++; if (!mac_isprint(c) || (!allow_tab && c == '\t')) nonprintcount++; length++; } if (nonprintcount == 0) return s; /* Get a new block of store guaranteed big enough to hold the expanded string. */ ss = store_get(length + nonprintcount * 3 + 1); /* Copy everying, escaping non printers. */ t = s; tt = ss; while (*t != 0) { int c = *t; if (mac_isprint(c) && (allow_tab || c != '\t')) *tt++ = *t++; else { *tt++ = '\\'; switch (*t) { case '\n': *tt++ = 'n'; break; case '\r': *tt++ = 'r'; break; case '\b': *tt++ = 'b'; break; case '\v': *tt++ = 'v'; break; case '\f': *tt++ = 'f'; break; case '\t': *tt++ = 't'; break; default: sprintf(CS tt, "%03o", *t); tt += 3; break; } t++; } } *tt = 0; return ss; } #endif /* COMPILE_UTILITY */ /************************************************* * Undo printing escapes in string * *************************************************/ /* This function is the reverse of string_printing2. It searches for backslash characters and if any are found, it makes a new copy of the string with escape sequences parsed. Otherwise it returns the original string. Arguments: s the input string Returns: string with printing escapes parsed back */ uschar * string_unprinting(uschar *s) { uschar *p, *q, *r, *ss; int len, off; p = Ustrchr(s, '\\'); if (!p) return s; len = Ustrlen(s) + 1; ss = store_get(len); q = ss; off = p - s; if (off) { memcpy(q, s, off); q += off; } while (*p) { if (*p == '\\') { *q++ = string_interpret_escape((const uschar **)&p); p++; } else { r = Ustrchr(p, '\\'); if (!r) { off = Ustrlen(p); memcpy(q, p, off); p += off; q += off; break; } else { off = r - p; memcpy(q, p, off); q += off; p = r; } } } *q = '\0'; return ss; } /************************************************* * Copy and save string * *************************************************/ /* This function assumes that memcpy() is faster than strcpy(). Argument: string to copy Returns: copy of string in new store */ uschar * string_copy(const uschar *s) { int len = Ustrlen(s) + 1; uschar *ss = store_get(len); memcpy(ss, s, len); return ss; } /************************************************* * Copy and save string in malloc'd store * *************************************************/ /* This function assumes that memcpy() is faster than strcpy(). Argument: string to copy Returns: copy of string in new store */ uschar * string_copy_malloc(const uschar *s) { int len = Ustrlen(s) + 1; uschar *ss = store_malloc(len); memcpy(ss, s, len); return ss; } /************************************************* * Copy, lowercase and save string * *************************************************/ /* Argument: string to copy Returns: copy of string in new store, with letters lowercased */ uschar * string_copylc(const uschar *s) { uschar *ss = store_get(Ustrlen(s) + 1); uschar *p = ss; while (*s != 0) *p++ = tolower(*s++); *p = 0; return ss; } /************************************************* * Copy and save string, given length * *************************************************/ /* It is assumed the data contains no zeros. A zero is added onto the end. Arguments: s string to copy n number of characters Returns: copy of string in new store */ uschar * string_copyn(const uschar *s, int n) { uschar *ss = store_get(n + 1); Ustrncpy(ss, s, n); ss[n] = 0; return ss; } /************************************************* * Copy, lowercase, and save string, given length * *************************************************/ /* It is assumed the data contains no zeros. A zero is added onto the end. Arguments: s string to copy n number of characters Returns: copy of string in new store, with letters lowercased */ uschar * string_copynlc(uschar *s, int n) { uschar *ss = store_get(n + 1); uschar *p = ss; while (n-- > 0) *p++ = tolower(*s++); *p = 0; return ss; } /************************************************* * Copy string if long, inserting newlines * *************************************************/ /* If the given string is longer than 75 characters, it is copied, and within the copy, certain space characters are converted into newlines. Argument: pointer to the string Returns: pointer to the possibly altered string */ uschar * string_split_message(uschar *msg) { uschar *s, *ss; if (msg == NULL || Ustrlen(msg) <= 75) return msg; s = ss = msg = string_copy(msg); for (;;) { int i = 0; while (i < 75 && *ss != 0 && *ss != '\n') ss++, i++; if (*ss == 0) break; if (*ss == '\n') s = ++ss; else { uschar *t = ss + 1; uschar *tt = NULL; while (--t > s + 35) { if (*t == ' ') { if (t[-1] == ':') { tt = t; break; } if (tt == NULL) tt = t; } } if (tt == NULL) /* Can't split behind - try ahead */ { t = ss + 1; while (*t != 0) { if (*t == ' ' || *t == '\n') { tt = t; break; } t++; } } if (tt == NULL) break; /* Can't find anywhere to split */ *tt = '\n'; s = ss = tt+1; } } return msg; } /************************************************* * Copy returned DNS domain name, de-escaping * *************************************************/ /* If a domain name contains top-bit characters, some resolvers return the fully qualified name with those characters turned into escapes. The convention is a backslash followed by _decimal_ digits. We convert these back into the original binary values. This will be relevant when allow_utf8_domains is set true and UTF-8 characters are used in domain names. Backslash can also be used to escape other characters, though we shouldn't come across them in domain names. Argument: the domain name string Returns: copy of string in new store, de-escaped */ uschar * string_copy_dnsdomain(uschar *s) { uschar *yield; uschar *ss = yield = store_get(Ustrlen(s) + 1); while (*s != 0) { if (*s != '\\') { *ss++ = *s++; } else if (isdigit(s[1])) { *ss++ = (s[1] - '0')*100 + (s[2] - '0')*10 + s[3] - '0'; s += 4; } else if (*(++s) != 0) { *ss++ = *s++; } } *ss = 0; return yield; } #ifndef COMPILE_UTILITY /************************************************* * Copy space-terminated or quoted string * *************************************************/ /* This function copies from a string until its end, or until whitespace is encountered, unless the string begins with a double quote, in which case the terminating quote is sought, and escaping within the string is done. The length of a de-quoted string can be no longer than the original, since escaping always turns n characters into 1 character. Argument: pointer to the pointer to the first character, which gets updated Returns: the new string */ uschar * string_dequote(const uschar **sptr) { const uschar *s = *sptr; uschar *t, *yield; /* First find the end of the string */ if (*s != '\"') { while (*s != 0 && !isspace(*s)) s++; } else { s++; while (*s != 0 && *s != '\"') { if (*s == '\\') (void)string_interpret_escape(&s); s++; } if (*s != 0) s++; } /* Get enough store to copy into */ t = yield = store_get(s - *sptr + 1); s = *sptr; /* Do the copy */ if (*s != '\"') { while (*s != 0 && !isspace(*s)) *t++ = *s++; } else { s++; while (*s != 0 && *s != '\"') { if (*s == '\\') *t++ = string_interpret_escape(&s); else *t++ = *s; s++; } if (*s != 0) s++; } /* Update the pointer and return the terminated copy */ *sptr = s; *t = 0; return yield; } #endif /* COMPILE_UTILITY */ /************************************************* * Format a string and save it * *************************************************/ /* The formatting is done by string_format, which checks the length of everything. Arguments: format a printf() format - deliberately char * rather than uschar * because it will most usually be a literal string ... arguments for format Returns: pointer to fresh piece of store containing sprintf'ed string */ uschar * string_sprintf(const char *format, ...) { va_list ap; uschar buffer[STRING_SPRINTF_BUFFER_SIZE]; va_start(ap, format); if (!string_vformat(buffer, sizeof(buffer), format, ap)) log_write(0, LOG_MAIN|LOG_PANIC_DIE, "string_sprintf expansion was longer than " SIZE_T_FMT " (%s)", sizeof(buffer), format); va_end(ap); return string_copy(buffer); } /************************************************* * Case-independent strncmp() function * *************************************************/ /* Arguments: s first string t second string n number of characters to compare Returns: < 0, = 0, or > 0, according to the comparison */ int strncmpic(const uschar *s, const uschar *t, int n) { while (n--) { int c = tolower(*s++) - tolower(*t++); if (c) return c; } return 0; } /************************************************* * Case-independent strcmp() function * *************************************************/ /* Arguments: s first string t second string Returns: < 0, = 0, or > 0, according to the comparison */ int strcmpic(const uschar *s, const uschar *t) { while (*s != 0) { int c = tolower(*s++) - tolower(*t++); if (c != 0) return c; } return *t; } /************************************************* * Case-independent strstr() function * *************************************************/ /* The third argument specifies whether whitespace is required to follow the matched string. Arguments: s string to search t substring to search for space_follows if TRUE, match only if whitespace follows Returns: pointer to substring in string, or NULL if not found */ uschar * strstric(uschar *s, uschar *t, BOOL space_follows) { uschar *p = t; uschar *yield = NULL; int cl = tolower(*p); int cu = toupper(*p); while (*s) { if (*s == cl || *s == cu) { if (yield == NULL) yield = s; if (*(++p) == 0) { if (!space_follows || s[1] == ' ' || s[1] == '\n' ) return yield; yield = NULL; p = t; } cl = tolower(*p); cu = toupper(*p); s++; } else if (yield != NULL) { yield = NULL; p = t; cl = tolower(*p); cu = toupper(*p); } else s++; } return NULL; } #ifndef COMPILE_UTILITY /************************************************* * Get next string from separated list * *************************************************/ /* Leading and trailing space is removed from each item. The separator in the list is controlled by the int pointed to by the separator argument as follows: If the value is > 0 it is used as the separator. This is typically used for sublists such as slash-separated options. The value is always a printing character. (If the value is actually > UCHAR_MAX there is only one item in the list. This is used for some cases when called via functions that sometimes plough through lists, and sometimes are given single items.) If the value is <= 0, the string is inspected for a leading 0 && isspace(buffer[p-1])) p--; buffer[p] = 0; } /* Handle the case when a buffer is not provided. */ else { int size = 0; int ptr = 0; const uschar *ss; /* We know that *s != 0 at this point. However, it might be pointing to a separator, which could indicate an empty string, or (if an ispunct() character) could be doubled to indicate a separator character as data at the start of a string. Avoid getting working memory for an empty item. */ if (*s == sep) { s++; if (*s != sep || sep_is_special) { *listptr = s; return string_copy(US""); } } /* Not an empty string; the first character is guaranteed to be a data character. */ for (;;) { for (ss = s + 1; *ss != 0 && *ss != sep; ss++); buffer = string_cat(buffer, &size, &ptr, s, ss-s); s = ss; if (*s == 0 || *(++s) != sep || sep_is_special) break; } while (ptr > 0 && isspace(buffer[ptr-1])) ptr--; buffer[ptr] = 0; } /* Update the current pointer and return the new string */ *listptr = s; return buffer; } #endif /* COMPILE_UTILITY */ #ifndef COMPILE_UTILITY /************************************************ * Add element to seperated list * ************************************************/ /* This function is used to build a list, returning an allocated null-terminated growable string. The given element has any embedded seperator characters doubled. Arguments: list points to the start of the list that is being built, or NULL if this is a new list that has no contents yet sep list seperator charactoer ele new lement to be appended to the list Returns: pointer to the start of the list, changed if copied for expansion. */ uschar * string_append_listele(uschar * list, uschar sep, const uschar * ele) { uschar * new = NULL; int sz = 0, off = 0; uschar * sp; if (list) { new = string_cat(new, &sz, &off, list, Ustrlen(list)); new = string_cat(new, &sz, &off, &sep, 1); } while((sp = Ustrchr(ele, sep))) { new = string_cat(new, &sz, &off, ele, sp-ele+1); new = string_cat(new, &sz, &off, &sep, 1); ele = sp+1; } new = string_cat(new, &sz, &off, ele, Ustrlen(ele)); new[off] = '\0'; return new; } static const uschar * Ustrnchr(const uschar * s, int c, unsigned * len) { unsigned siz = *len; while (siz) { if (!*s) return NULL; if (*s == c) { *len = siz; return s; } s++; siz--; } return NULL; } uschar * string_append_listele_n(uschar * list, uschar sep, const uschar * ele, unsigned len) { uschar * new = NULL; int sz = 0, off = 0; const uschar * sp; if (list) { new = string_cat(new, &sz, &off, list, Ustrlen(list)); new = string_cat(new, &sz, &off, &sep, 1); } while((sp = Ustrnchr(ele, sep, &len))) { new = string_cat(new, &sz, &off, ele, sp-ele+1); new = string_cat(new, &sz, &off, &sep, 1); ele = sp+1; len--; } new = string_cat(new, &sz, &off, ele, len); new[off] = '\0'; return new; } #endif /* COMPILE_UTILITY */ #ifndef COMPILE_UTILITY /************************************************* * Add chars to string * *************************************************/ /* This function is used when building up strings of unknown length. Room is always left for a terminating zero to be added to the string that is being built. This function does not require the string that is being added to be NUL terminated, because the number of characters to add is given explicitly. It is sometimes called to extract parts of other strings. Arguments: string points to the start of the string that is being built, or NULL if this is a new string that has no contents yet size points to a variable that holds the current capacity of the memory block (updated if changed) ptr points to a variable that holds the offset at which to add characters, updated to the new offset s points to characters to add count count of characters to add; must not exceed the length of s, if s is a C string If string is given as NULL, *size and *ptr should both be zero. Returns: pointer to the start of the string, changed if copied for expansion. Note that a NUL is not added, though space is left for one. This is because string_cat() is often called multiple times to build up a string - there's no point adding the NUL till the end. */ uschar * string_cat(uschar *string, int *size, int *ptr, const uschar *s, int count) { int p = *ptr; if (p + count >= *size) { int oldsize = *size; /* Mostly, string_cat() is used to build small strings of a few hundred characters at most. There are times, however, when the strings are very much longer (for example, a lookup that returns a vast number of alias addresses). To try to keep things reasonable, we use increments whose size depends on the existing length of the string. */ int inc = (oldsize < 4096)? 100 : 1024; while (*size <= p + count) *size += inc; /* New string */ if (string == NULL) string = store_get(*size); /* Try to extend an existing allocation. If the result of calling store_extend() is false, either there isn't room in the current memory block, or this string is not the top item on the dynamic store stack. We then have to get a new chunk of store and copy the old string. When building large strings, it is helpful to call store_release() on the old string, to release memory blocks that have become empty. (The block will be freed if the string is at its start.) However, we can do this only if we know that the old string was the last item on the dynamic memory stack. This is the case if it matches store_last_get. */ else if (!store_extend(string, oldsize, *size)) { BOOL release_ok = store_last_get[store_pool] == string; uschar *newstring = store_get(*size); memcpy(newstring, string, p); if (release_ok) store_release(string); string = newstring; } } /* Because we always specify the exact number of characters to copy, we can use memcpy(), which is likely to be more efficient than strncopy() because the latter has to check for zero bytes. */ memcpy(string + p, s, count); *ptr = p + count; return string; } #endif /* COMPILE_UTILITY */ #ifndef COMPILE_UTILITY /************************************************* * Append strings to another string * *************************************************/ /* This function can be used to build a string from many other strings. It calls string_cat() to do the dirty work. Arguments: string points to the start of the string that is being built, or NULL if this is a new string that has no contents yet size points to a variable that holds the current capacity of the memory block (updated if changed) ptr points to a variable that holds the offset at which to add characters, updated to the new offset count the number of strings to append ... "count" uschar* arguments, which must be valid zero-terminated C strings Returns: pointer to the start of the string, changed if copied for expansion. The string is not zero-terminated - see string_cat() above. */ uschar * string_append(uschar *string, int *size, int *ptr, int count, ...) { va_list ap; int i; va_start(ap, count); for (i = 0; i < count; i++) { uschar *t = va_arg(ap, uschar *); string = string_cat(string, size, ptr, t, Ustrlen(t)); } va_end(ap); return string; } #endif /************************************************* * Format a string with length checks * *************************************************/ /* This function is used to format a string with checking of the length of the output for all conversions. It protects Exim from absent-mindedness when calling functions like debug_printf and string_sprintf, and elsewhere. There are two different entry points to what is actually the same function, depending on whether the variable length list of data arguments are given explicitly or as a va_list item. The formats are the usual printf() ones, with some omissions (never used) and two additions for strings: %S forces lower case, and %#s or %#S prints nothing for a NULL string. Without the # "NULL" is printed (useful in debugging). There is also the addition of %D and %M, which insert the date in the form used for datestamped log files. Arguments: buffer a buffer in which to put the formatted string buflen the length of the buffer format the format string - deliberately char * and not uschar * ... or ap variable list of supplementary arguments Returns: TRUE if the result fitted in the buffer */ BOOL string_format(uschar *buffer, int buflen, const char *format, ...) { BOOL yield; va_list ap; va_start(ap, format); yield = string_vformat(buffer, buflen, format, ap); va_end(ap); return yield; } BOOL string_vformat(uschar *buffer, int buflen, const char *format, va_list ap) { /* We assume numbered ascending order, C does not guarantee that */ enum { L_NORMAL=1, L_SHORT=2, L_LONG=3, L_LONGLONG=4, L_LONGDOUBLE=5, L_SIZE=6 }; BOOL yield = TRUE; int width, precision; const char *fp = format; /* Deliberately not unsigned */ uschar *p = buffer; uschar *last = buffer + buflen - 1; string_datestamp_offset = -1; /* Datestamp not inserted */ string_datestamp_length = 0; /* Datestamp not inserted */ string_datestamp_type = 0; /* Datestamp not inserted */ /* Scan the format and handle the insertions */ while (*fp != 0) { int length = L_NORMAL; int *nptr; int slen; const char *null = "NULL"; /* ) These variables */ const char *item_start, *s; /* ) are deliberately */ char newformat[16]; /* ) not unsigned */ /* Non-% characters just get copied verbatim */ if (*fp != '%') { if (p >= last) { yield = FALSE; break; } *p++ = (uschar)*fp++; continue; } /* Deal with % characters. Pick off the width and precision, for checking strings, skipping over the flag and modifier characters. */ item_start = fp; width = precision = -1; if (strchr("-+ #0", *(++fp)) != NULL) { if (*fp == '#') null = ""; fp++; } if (isdigit((uschar)*fp)) { width = *fp++ - '0'; while (isdigit((uschar)*fp)) width = width * 10 + *fp++ - '0'; } else if (*fp == '*') { width = va_arg(ap, int); fp++; } if (*fp == '.') { if (*(++fp) == '*') { precision = va_arg(ap, int); fp++; } else { precision = 0; while (isdigit((uschar)*fp)) precision = precision*10 + *fp++ - '0'; } } /* Skip over 'h', 'L', 'l', 'll' and 'z', remembering the item length */ if (*fp == 'h') { fp++; length = L_SHORT; } else if (*fp == 'L') { fp++; length = L_LONGDOUBLE; } else if (*fp == 'l') { if (fp[1] == 'l') { fp += 2; length = L_LONGLONG; } else { fp++; length = L_LONG; } } else if (*fp == 'z') { fp++; length = L_SIZE; } /* Handle each specific format type. */ switch (*fp++) { case 'n': nptr = va_arg(ap, int *); *nptr = p - buffer; break; case 'd': case 'o': case 'u': case 'x': case 'X': if (p >= last - ((length > L_LONG)? 24 : 12)) { yield = FALSE; goto END_FORMAT; } strncpy(newformat, item_start, fp - item_start); newformat[fp - item_start] = 0; /* Short int is promoted to int when passing through ..., so we must use int for va_arg(). */ switch(length) { case L_SHORT: case L_NORMAL: sprintf(CS p, newformat, va_arg(ap, int)); break; case L_LONG: sprintf(CS p, newformat, va_arg(ap, long int)); break; case L_LONGLONG: sprintf(CS p, newformat, va_arg(ap, LONGLONG_T)); break; case L_SIZE: sprintf(CS p, newformat, va_arg(ap, size_t)); break; } while (*p) p++; break; case 'p': if (p >= last - 24) { yield = FALSE; goto END_FORMAT; } strncpy(newformat, item_start, fp - item_start); newformat[fp - item_start] = 0; sprintf(CS p, newformat, va_arg(ap, void *)); while (*p) p++; break; /* %f format is inherently insecure if the numbers that it may be handed are unknown (e.g. 1e300). However, in Exim, %f is used for printing load averages, and these are actually stored as integers (load average * 1000) so the size of the numbers is constrained. It is also used for formatting sending rates, where the simplicity of the format prevents overflow. */ case 'f': case 'e': case 'E': case 'g': case 'G': if (precision < 0) precision = 6; if (p >= last - precision - 8) { yield = FALSE; goto END_FORMAT; } strncpy(newformat, item_start, fp - item_start); newformat[fp-item_start] = 0; if (length == L_LONGDOUBLE) sprintf(CS p, newformat, va_arg(ap, long double)); else sprintf(CS p, newformat, va_arg(ap, double)); while (*p) p++; break; /* String types */ case '%': if (p >= last) { yield = FALSE; goto END_FORMAT; } *p++ = '%'; break; case 'c': if (p >= last) { yield = FALSE; goto END_FORMAT; } *p++ = va_arg(ap, int); break; case 'D': /* Insert daily datestamp for log file names */ s = CS tod_stamp(tod_log_datestamp_daily); string_datestamp_offset = p - buffer; /* Passed back via global */ string_datestamp_length = Ustrlen(s); /* Passed back via global */ string_datestamp_type = tod_log_datestamp_daily; slen = string_datestamp_length; goto INSERT_STRING; case 'M': /* Insert monthly datestamp for log file names */ s = CS tod_stamp(tod_log_datestamp_monthly); string_datestamp_offset = p - buffer; /* Passed back via global */ string_datestamp_length = Ustrlen(s); /* Passed back via global */ string_datestamp_type = tod_log_datestamp_monthly; slen = string_datestamp_length; goto INSERT_STRING; case 's': case 'S': /* Forces *lower* case */ s = va_arg(ap, char *); if (s == NULL) s = null; slen = Ustrlen(s); INSERT_STRING: /* Come to from %D or %M above */ /* If the width is specified, check that there is a precision set; if not, set it to the width to prevent overruns of long strings. */ if (width >= 0) { if (precision < 0) precision = width; } /* If a width is not specified and the precision is specified, set the width to the precision, or the string length if shorted. */ else if (precision >= 0) { width = (precision < slen)? precision : slen; } /* If neither are specified, set them both to the string length. */ else width = precision = slen; /* Check string space, and add the string to the buffer if ok. If not OK, add part of the string (debugging uses this to show as much as possible). */ if (p == last) { yield = FALSE; goto END_FORMAT; } if (p >= last - width) { yield = FALSE; width = precision = last - p - 1; if (width < 0) width = 0; if (precision < 0) precision = 0; } sprintf(CS p, "%*.*s", width, precision, s); if (fp[-1] == 'S') while (*p) { *p = tolower(*p); p++; } else while (*p) p++; if (!yield) goto END_FORMAT; break; /* Some things are never used in Exim; also catches junk. */ default: strncpy(newformat, item_start, fp - item_start); newformat[fp-item_start] = 0; log_write(0, LOG_MAIN|LOG_PANIC_DIE, "string_format: unsupported type " "in \"%s\" in \"%s\"", newformat, format); break; } } /* Ensure string is complete; return TRUE if got to the end of the format */ END_FORMAT: *p = 0; return yield; } #ifndef COMPILE_UTILITY /************************************************* * Generate an "open failed" message * *************************************************/ /* This function creates a message after failure to open a file. It includes a string supplied as data, adds the strerror() text, and if the failure was "Permission denied", reads and includes the euid and egid. Arguments: eno the value of errno after the failure format a text format string - deliberately not uschar * ... arguments for the format string Returns: a message, in dynamic store */ uschar * string_open_failed(int eno, const char *format, ...) { va_list ap; uschar buffer[1024]; Ustrcpy(buffer, "failed to open "); va_start(ap, format); /* Use the checked formatting routine to ensure that the buffer does not overflow. It should not, since this is called only for internally specified messages. If it does, the message just gets truncated, and there doesn't seem much we can do about that. */ (void)string_vformat(buffer+15, sizeof(buffer) - 15, format, ap); return (eno == EACCES)? string_sprintf("%s: %s (euid=%ld egid=%ld)", buffer, strerror(eno), (long int)geteuid(), (long int)getegid()) : string_sprintf("%s: %s", buffer, strerror(eno)); } #endif /* COMPILE_UTILITY */ #ifndef COMPILE_UTILITY /************************************************* * Generate local prt for logging * *************************************************/ /* This function is a subroutine for use in string_log_address() below. Arguments: addr the address being logged yield the current dynamic buffer pointer sizeptr points to current size ptrptr points to current insert pointer Returns: the new value of the buffer pointer */ static uschar * string_get_localpart(address_item *addr, uschar *yield, int *sizeptr, int *ptrptr) { uschar * s; s = addr->prefix; if (testflag(addr, af_include_affixes) && s) { #ifdef EXPERIMENTAL_INTERNATIONAL if (testflag(addr, af_utf8_downcvt)) s = string_localpart_utf8_to_alabel(s, NULL); #endif yield = string_cat(yield, sizeptr, ptrptr, s, Ustrlen(s)); } s = addr->local_part; #ifdef EXPERIMENTAL_INTERNATIONAL if (testflag(addr, af_utf8_downcvt)) s = string_localpart_utf8_to_alabel(s, NULL); #endif yield = string_cat(yield, sizeptr, ptrptr, s, Ustrlen(s)); s = addr->suffix; if (testflag(addr, af_include_affixes) && s) { #ifdef EXPERIMENTAL_INTERNATIONAL if (testflag(addr, af_utf8_downcvt)) s = string_localpart_utf8_to_alabel(s, NULL); #endif yield = string_cat(yield, sizeptr, ptrptr, s, Ustrlen(s)); } return yield; } /************************************************* * Generate log address list * *************************************************/ /* This function generates a list consisting of an address and its parents, for use in logging lines. For saved onetime aliased addresses, the onetime parent field is used. If the address was delivered by a transport with rcpt_include_ affixes set, the af_include_affixes bit will be set in the address. In that case, we include the affixes here too. Arguments: addr bottom (ultimate) address all_parents if TRUE, include all parents success TRUE for successful delivery Returns: a string in dynamic store */ uschar * string_log_address(address_item *addr, BOOL all_parents, BOOL success) { int size = 64; int ptr = 0; BOOL add_topaddr = TRUE; uschar *yield = store_get(size); address_item *topaddr; /* Find the ultimate parent */ for (topaddr = addr; topaddr->parent != NULL; topaddr = topaddr->parent); /* We start with just the local part for pipe, file, and reply deliveries, and for successful local deliveries from routers that have the log_as_local flag set. File deliveries from filters can be specified as non-absolute paths in cases where the transport is goin to complete the path. If there is an error before this happens (expansion failure) the local part will not be updated, and so won't necessarily look like a path. Add extra text for this case. */ if (testflag(addr, af_pfr) || (success && addr->router != NULL && addr->router->log_as_local && addr->transport != NULL && addr->transport->info->local)) { if (testflag(addr, af_file) && addr->local_part[0] != '/') yield = string_cat(yield, &size, &ptr, CUS"save ", 5); yield = string_get_localpart(addr, yield, &size, &ptr); } /* Other deliveries start with the full address. It we have split it into local part and domain, use those fields. Some early failures can happen before the splitting is done; in those cases use the original field. */ else { if (addr->local_part != NULL) { const uschar * s; yield = string_get_localpart(addr, yield, &size, &ptr); yield = string_cat(yield, &size, &ptr, US"@", 1); s = addr->domain; #ifdef EXPERIMENTAL_INTERNATIONAL if (testflag(addr, af_utf8_downcvt)) s = string_localpart_utf8_to_alabel(s, NULL); #endif yield = string_cat(yield, &size, &ptr, s, Ustrlen(s) ); } else { yield = string_cat(yield, &size, &ptr, addr->address, Ustrlen(addr->address)); } yield[ptr] = 0; /* If the address we are going to print is the same as the top address, and all parents are not being included, don't add on the top address. First of all, do a caseless comparison; if this succeeds, do a caseful comparison on the local parts. */ if (strcmpic(yield, topaddr->address) == 0 && Ustrncmp(yield, topaddr->address, Ustrchr(yield, '@') - yield) == 0 && addr->onetime_parent == NULL && (!all_parents || addr->parent == NULL || addr->parent == topaddr)) add_topaddr = FALSE; } /* If all parents are requested, or this is a local pipe/file/reply, and there is at least one intermediate parent, show it in brackets, and continue with all of them if all are wanted. */ if ((all_parents || testflag(addr, af_pfr)) && addr->parent != NULL && addr->parent != topaddr) { uschar *s = US" ("; address_item *addr2; for (addr2 = addr->parent; addr2 != topaddr; addr2 = addr2->parent) { yield = string_cat(yield, &size, &ptr, s, 2); yield = string_cat(yield, &size, &ptr, addr2->address, Ustrlen(addr2->address)); if (!all_parents) break; s = US", "; } yield = string_cat(yield, &size, &ptr, US")", 1); } /* Add the top address if it is required */ if (add_topaddr) { yield = string_cat(yield, &size, &ptr, US" <", 2); if (addr->onetime_parent == NULL) yield = string_cat(yield, &size, &ptr, topaddr->address, Ustrlen(topaddr->address)); else yield = string_cat(yield, &size, &ptr, addr->onetime_parent, Ustrlen(addr->onetime_parent)); yield = string_cat(yield, &size, &ptr, US">", 1); } yield[ptr] = 0; /* string_cat() leaves space */ return yield; } #endif /* COMPILE_UTILITY */ /************************************************* ************************************************** * Stand-alone test program * ************************************************** *************************************************/ #ifdef STAND_ALONE int main(void) { uschar buffer[256]; printf("Testing is_ip_address\n"); while (fgets(CS buffer, sizeof(buffer), stdin) != NULL) { int offset; buffer[Ustrlen(buffer) - 1] = 0; printf("%d\n", string_is_ip_address(buffer, NULL)); printf("%d %d %s\n", string_is_ip_address(buffer, &offset), offset, buffer); } printf("Testing string_nextinlist\n"); while (fgets(CS buffer, sizeof(buffer), stdin) != NULL) { uschar *list = buffer; uschar *lp1, *lp2; uschar item[256]; int sep1 = 0; int sep2 = 0; if (*list == '<') { sep1 = sep2 = list[1]; list += 2; } lp1 = lp2 = list; for (;;) { uschar *item1 = string_nextinlist(&lp1, &sep1, item, sizeof(item)); uschar *item2 = string_nextinlist(&lp2, &sep2, NULL, 0); if (item1 == NULL && item2 == NULL) break; if (item == NULL || item2 == NULL || Ustrcmp(item1, item2) != 0) { printf("***ERROR\nitem1=\"%s\"\nitem2=\"%s\"\n", (item1 == NULL)? "NULL" : CS item1, (item2 == NULL)? "NULL" : CS item2); break; } else printf(" \"%s\"\n", CS item1); } } /* This is a horrible lash-up, but it serves its purpose. */ printf("Testing string_format\n"); while (fgets(CS buffer, sizeof(buffer), stdin) != NULL) { void *args[3]; long long llargs[3]; double dargs[3]; int dflag = 0; int llflag = 0; int n = 0; int count; int countset = 0; uschar format[256]; uschar outbuf[256]; uschar *s; buffer[Ustrlen(buffer) - 1] = 0; s = Ustrchr(buffer, ','); if (s == NULL) s = buffer + Ustrlen(buffer); Ustrncpy(format, buffer, s - buffer); format[s-buffer] = 0; if (*s == ',') s++; while (*s != 0) { uschar *ss = s; s = Ustrchr(ss, ','); if (s == NULL) s = ss + Ustrlen(ss); if (isdigit(*ss)) { Ustrncpy(outbuf, ss, s-ss); if (Ustrchr(outbuf, '.') != NULL) { dflag = 1; dargs[n++] = Ustrtod(outbuf, NULL); } else if (Ustrstr(outbuf, "ll") != NULL) { llflag = 1; llargs[n++] = strtoull(CS outbuf, NULL, 10); } else { args[n++] = (void *)Uatoi(outbuf); } } else if (Ustrcmp(ss, "*") == 0) { args[n++] = (void *)(&count); countset = 1; } else { uschar *sss = malloc(s - ss + 1); Ustrncpy(sss, ss, s-ss); args[n++] = sss; } if (*s == ',') s++; } if (!dflag && !llflag) printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format, args[0], args[1], args[2])? "True" : "False"); else if (dflag) printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format, dargs[0], dargs[1], dargs[2])? "True" : "False"); else printf("%s\n", string_format(outbuf, sizeof(outbuf), CS format, llargs[0], llargs[1], llargs[2])? "True" : "False"); printf("%s\n", CS outbuf); if (countset) printf("count=%d\n", count); } return 0; } #endif /* End of string.c */