Add ${rfc2047d: expansion.

[exim.git] / src / src / expand.c
diff --git a/src/src/expand.c b/src/src/expand.c

index 273f2a507fdbc5111e5ba51bcdc56fe2772288c2..b2674dd4220734f150f061a9944cbbcefccde4b8 100644 (file)
--- a/src/src/expand.c
+++ b/src/src/expand.c
@@ -1,10 +1,10 @@
-/* $Cambridge: exim/src/src/expand.c,v 1.41 2005/08/23 08:46:33 ph10 Exp $ */
+/* $Cambridge: exim/src/src/expand.c,v 1.79 2007/01/31 11:30:08 ph10 Exp $ */
  
  /*************************************************
  *     Exim - an Internet mail transport agent    *
  *************************************************/
  
-/* Copyright (c) University of Cambridge 1995 - 2005 */
+/* Copyright (c) University of Cambridge 1995 - 2007 */
  /* See the file NOTICE for conditions of use and distribution. */
  
  
@@ -13,12 +13,20 @@
  
  #include "exim.h"
  
+/* Recursively called function */
+
+static uschar *expand_string_internal(uschar *, BOOL, uschar **, BOOL);
+
  #ifdef STAND_ALONE
  #ifndef SUPPORT_CRYPTEQ
  #define SUPPORT_CRYPTEQ
  #endif
  #endif
  
+#ifdef LOOKUP_LDAP
+#include "lookups/ldap.h"
+#endif
+
  #ifdef SUPPORT_CRYPTEQ
  #ifdef CRYPT_H
  #include <crypt.h>
@@ -28,15 +36,63 @@ extern char* crypt16(char*, char*);
  #endif
  #endif
  
-#ifdef LOOKUP_LDAP
-#include "lookups/ldap.h"
-#endif
-
-
-
-/* Recursively called function */
+/* The handling of crypt16() is a mess. I will record below the analysis of the
+mess that was sent to me. We decided, however, to make changing this very low
+priority, because in practice people are moving away from the crypt()
+algorithms nowadays, so it doesn't seem worth it.
+
+<quote>
+There is an algorithm named "crypt16" in Ultrix and Tru64.  It crypts
+the first 8 characters of the password using a 20-round version of crypt
+(standard crypt does 25 rounds).  It then crypts the next 8 characters,
+or an empty block if the password is less than 9 characters, using a
+20-round version of crypt and the same salt as was used for the first
+block.  Charaters after the first 16 are ignored.  It always generates
+a 16-byte hash, which is expressed together with the salt as a string
+of 24 base 64 digits.  Here are some links to peruse:
+
+        http://cvs.pld.org.pl/pam/pamcrypt/crypt16.c?rev=1.2
+        http://seclists.org/bugtraq/1999/Mar/0076.html
+
+There's a different algorithm named "bigcrypt" in HP-UX, Digital Unix,
+and OSF/1.  This is the same as the standard crypt if given a password
+of 8 characters or less.  If given more, it first does the same as crypt
+using the first 8 characters, then crypts the next 8 (the 9th to 16th)
+using as salt the first two base 64 digits from the first hash block.
+If the password is more than 16 characters then it crypts the 17th to 24th
+characters using as salt the first two base 64 digits from the second hash
+block.  And so on: I've seen references to it cutting off the password at
+40 characters (5 blocks), 80 (10 blocks), or 128 (16 blocks).  Some links:
+
+        http://cvs.pld.org.pl/pam/pamcrypt/bigcrypt.c?rev=1.2
+        http://seclists.org/bugtraq/1999/Mar/0109.html
+        http://h30097.www3.hp.com/docs/base_doc/DOCUMENTATION/HTML/AA-Q0R2D-
+             TET1_html/sec.c222.html#no_id_208
+
+Exim has something it calls "crypt16".  It will either use a native
+crypt16 or its own implementation.  A native crypt16 will presumably
+be the one that I called "crypt16" above.  The internal "crypt16"
+function, however, is a two-block-maximum implementation of what I called
+"bigcrypt".  The documentation matches the internal code.
+
+I suspect that whoever did the "crypt16" stuff for Exim didn't realise
+that crypt16 and bigcrypt were different things.
+
+Exim uses the LDAP-style scheme identifier "{crypt16}" to refer
+to whatever it is using under that name.  This unfortunately sets a
+precedent for using "{crypt16}" to identify two incompatible algorithms
+whose output can't be distinguished.  With "{crypt16}" thus rendered
+ambiguous, I suggest you deprecate it and invent two new identifiers
+for the two algorithms.
+
+Both crypt16 and bigcrypt are very poor algorithms, btw.  Hashing parts
+of the password separately means they can be cracked separately, so
+the double-length hash only doubles the cracking effort instead of
+squaring it.  I recommend salted SHA-1 ({SSHA}), or the Blowfish-based
+bcrypt ({CRYPT}$2a$).
+</quote>
+*/
  
-static uschar *expand_string_internal(uschar *, BOOL, uschar **, BOOL);
  
  
  
@@ -94,12 +150,14 @@ static uschar *op_table_underscore[] = {
    US"from_utf8",
    US"local_part",
    US"quote_local_part",
+  US"time_eval",
    US"time_interval"};
  
  enum {
    EOP_FROM_UTF8,
    EOP_LOCAL_PART,
    EOP_QUOTE_LOCAL_PART,
+  EOP_TIME_EVAL,
    EOP_TIME_INTERVAL };
  
  static uschar *op_table_main[] = {
@@ -123,6 +181,7 @@ static uschar *op_table_main[] = {
    US"nhash",
    US"quote",
    US"rfc2047",
+  US"rfc2047d",
    US"rxquote",
    US"s",
    US"sha1",
@@ -153,6 +212,7 @@ enum {
    EOP_NHASH,
    EOP_QUOTE,
    EOP_RFC2047,
+  EOP_RFC2047D,
    EOP_RXQUOTE,
    EOP_S,
    EOP_SHA1,
@@ -272,7 +332,8 @@ enum {
    vtype_stringptr,      /* value is address of pointer to string */
    vtype_msgbody,        /* as stringptr, but read when first required */
    vtype_msgbody_end,    /* ditto, the end of the message */
-  vtype_msgheaders,     /* the message's headers */
+  vtype_msgheaders,     /* the message's headers, processed */
+  vtype_msgheaders_raw, /* the message's headers, unprocessed */
    vtype_localpart,      /* extract local part from string */
    vtype_domain,         /* extract domain from string */
    vtype_recipients,     /* extract recipients from recipients list */
@@ -298,26 +359,8 @@ enum {
  /* This table must be kept in alphabetical order. */
  
  static var_entry var_table[] = {
-  { "acl_c0",              vtype_stringptr,   &acl_var[0] },
-  { "acl_c1",              vtype_stringptr,   &acl_var[1] },
-  { "acl_c2",              vtype_stringptr,   &acl_var[2] },
-  { "acl_c3",              vtype_stringptr,   &acl_var[3] },
-  { "acl_c4",              vtype_stringptr,   &acl_var[4] },
-  { "acl_c5",              vtype_stringptr,   &acl_var[5] },
-  { "acl_c6",              vtype_stringptr,   &acl_var[6] },
-  { "acl_c7",              vtype_stringptr,   &acl_var[7] },
-  { "acl_c8",              vtype_stringptr,   &acl_var[8] },
-  { "acl_c9",              vtype_stringptr,   &acl_var[9] },
-  { "acl_m0",              vtype_stringptr,   &acl_var[10] },
-  { "acl_m1",              vtype_stringptr,   &acl_var[11] },
-  { "acl_m2",              vtype_stringptr,   &acl_var[12] },
-  { "acl_m3",              vtype_stringptr,   &acl_var[13] },
-  { "acl_m4",              vtype_stringptr,   &acl_var[14] },
-  { "acl_m5",              vtype_stringptr,   &acl_var[15] },
-  { "acl_m6",              vtype_stringptr,   &acl_var[16] },
-  { "acl_m7",              vtype_stringptr,   &acl_var[17] },
-  { "acl_m8",              vtype_stringptr,   &acl_var[18] },
-  { "acl_m9",              vtype_stringptr,   &acl_var[19] },
+  /* WARNING: Do not invent variables whose names start acl_c or acl_m because
+     they will be confused with user-creatable ACL variables. */
    { "acl_verify_message",  vtype_stringptr,   &acl_verify_message },
    { "address_data",        vtype_stringptr,   &deliver_address_data },
    { "address_file",        vtype_stringptr,   &address_file },
@@ -401,6 +444,7 @@ static var_entry var_table[] = {
    { "message_body_size",   vtype_int,         &message_body_size },
    { "message_exim_id",     vtype_stringptr,   &message_id },
    { "message_headers",     vtype_msgheaders,  NULL },
+  { "message_headers_raw", vtype_msgheaders_raw, NULL },
    { "message_id",          vtype_stringptr,   &message_id },
    { "message_linecount",   vtype_int,         &message_linecount },
    { "message_size",        vtype_int,         &message_size },
@@ -450,6 +494,8 @@ static var_entry var_table[] = {
    { "rcpt_fail_count",     vtype_int,         &rcpt_fail_count },
    { "received_count",      vtype_int,         &received_count },
    { "received_for",        vtype_stringptr,   &received_for },
+  { "received_ip_address", vtype_stringptr,   &interface_address },
+  { "received_port",       vtype_int,         &interface_port },
    { "received_protocol",   vtype_stringptr,   &received_protocol },
    { "received_time",       vtype_int,         &received_time },
    { "recipient_data",      vtype_stringptr,   &recipient_data },
@@ -481,8 +527,12 @@ static var_entry var_table[] = {
    { "sender_rate_period",  vtype_stringptr,   &sender_rate_period },
    { "sender_rcvhost",      vtype_stringptr,   &sender_rcvhost },
    { "sender_verify_failure",vtype_stringptr,  &sender_verify_failure },
+  { "sending_ip_address",  vtype_stringptr,   &sending_ip_address },
+  { "sending_port",        vtype_int,         &sending_port },
    { "smtp_active_hostname", vtype_stringptr,  &smtp_active_hostname },
-  { "smtp_command_argument", vtype_stringptr, &smtp_command_argument },
+  { "smtp_command",        vtype_stringptr,   &smtp_cmd_buffer },
+  { "smtp_command_argument", vtype_stringptr, &smtp_cmd_argument },
+  { "smtp_count_at_connection_start", vtype_int, &smtp_accept_count },
    { "sn0",                 vtype_filter_int,  &filter_sn[0] },
    { "sn1",                 vtype_filter_int,  &filter_sn[1] },
    { "sn2",                 vtype_filter_int,  &filter_sn[2] },
@@ -1093,7 +1143,8 @@ Arguments:
    newsize       return the size of memory block that was obtained; may be NULL
                  if exists_only is TRUE
    want_raw      TRUE if called for $rh_ or $rheader_ variables; no processing,
-                other than concatenating, will be done on the header
+                other than concatenating, will be done on the header. Also used
+                for $message_headers_raw.
    charset       name of charset to translate MIME words to; used only if
                  want_raw is false; if NULL, no translation is done (this is
                  used for $bh_ and $bheader_)
@@ -1136,6 +1187,12 @@ for (i = 0; i < 2; i++)
            while (isspace(*t)) t++;          /* remove leading white space */
          ilen = h->slen - (t - h->text);     /* length to insert */
  
+        /* Unless wanted raw, remove trailing whitespace, including the
+        newline. */
+
+        if (!want_raw)
+          while (ilen > 0 && isspace(t[ilen-1])) ilen--;
+
          /* Set comma = 1 if handling a single header and it's one of those
          that contains an address list, except when asked for raw headers. Only
          need to do this once. */
@@ -1147,7 +1204,7 @@ for (i = 0; i < 2; i++)
          /* First pass - compute total store needed; second pass - compute
          total store used, including this header. */
  
-        size += ilen + comma;
+        size += ilen + comma + 1;  /* +1 for the newline */
  
          /* Second pass - concatentate the data, up to a maximum. Note that
          the loop stops when size hits the limit. */
@@ -1156,14 +1213,19 @@ for (i = 0; i < 2; i++)
            {
            if (size > header_insert_maxlen)
              {
-            ilen -= size - header_insert_maxlen;
+            ilen -= size - header_insert_maxlen - 1;
              comma = 0;
              }
            Ustrncpy(ptr, t, ilen);
            ptr += ilen;
-          if (comma != 0 && ilen > 0)
+
+          /* For a non-raw header, put in the comma if needed, then add
+          back the newline we removed above, provided there was some text in
+          the header. */
+
+          if (!want_raw && ilen > 0)
              {
-            ptr[-1] = ',';
+            if (comma != 0) *ptr++ = ',';
              *ptr++ = '\n';
              }
            }
@@ -1171,8 +1233,9 @@ for (i = 0; i < 2; i++)
        }
      }
  
-  /* At end of first pass, truncate size if necessary, and get the buffer
-  to hold the data, returning the buffer size. */
+  /* At end of first pass, return NULL if no header found. Then truncate size
+  if necessary, and get the buffer to hold the data, returning the buffer size.
+  */
  
    if (i == 0)
      {
@@ -1183,10 +1246,6 @@ for (i = 0; i < 2; i++)
      }
    }
  
-/* Remove a redundant added comma if present */
-
-if (comma != 0 && ptr > yield) ptr -= 2;
-
  /* That's all we do for raw header expansion. */
  
  if (want_raw)
@@ -1194,17 +1253,19 @@ if (want_raw)
    *ptr = 0;
    }
  
-/* Otherwise, we remove trailing whitespace, including newlines. Then we do RFC
-2047 decoding, translating the charset if requested. The rfc2047_decode2()
+/* Otherwise, remove a final newline and a redundant added comma. Then we do
+RFC 2047 decoding, translating the charset if requested. The rfc2047_decode2()
  function can return an error with decoded data if the charset translation
  fails. If decoding fails, it returns NULL. */
  
  else
    {
    uschar *decoded, *error;
-  while (ptr > yield && isspace(ptr[-1])) ptr--;
+  if (ptr > yield && ptr[-1] == '\n') ptr--;
+  if (ptr > yield && comma != 0 && ptr[-1] == ',') ptr--;
    *ptr = 0;
-  decoded = rfc2047_decode2(yield, TRUE, charset, '?', NULL, newsize, &error);
+  decoded = rfc2047_decode2(yield, check_rfc2047_length, charset, '?', NULL,
+    newsize, &error);
    if (error != NULL)
      {
      DEBUG(D_any) debug_printf("*** error in RFC 2047 decoding: %s\n"
@@ -1247,6 +1308,37 @@ find_variable(uschar *name, BOOL exists_only, BOOL skipping, int *newsize)
  int first = 0;
  int last = var_table_size;
  
+/* Handle ACL variables, whose names are of the form acl_cxxx or acl_mxxx.
+Originally, xxx had to be a number in the range 0-9 (later 0-19), but from
+release 4.64 onwards arbitrary names are permitted, as long as the first 5
+characters are acl_c or acl_m and the sixth is either a digit or an underscore
+(this gave backwards compatibility at the changeover). There may be built-in
+variables whose names start acl_ but they should never start in this way. This
+slightly messy specification is a consequence of the history, needless to say.
+
+If an ACL variable does not exist, treat it as empty, unless strict_acl_vars is
+set, in which case give an error. */
+
+if ((Ustrncmp(name, "acl_c", 5) == 0 || Ustrncmp(name, "acl_m", 5) == 0) &&
+     !isalpha(name[5]))
+  {
+  tree_node *node =
+    tree_search((name[4] == 'c')? acl_var_c : acl_var_m, name + 4);
+  return (node == NULL)? (strict_acl_vars? NULL : US"") : node->data.ptr;
+  }
+
+/* Handle $auth<n> variables. */
+
+if (Ustrncmp(name, "auth", 4) == 0)
+  {
+  uschar *endptr;
+  int n = Ustrtoul(name + 4, &endptr, 10);
+  if (*endptr == 0 && n != 0 && n <= AUTH_VARS)
+    return (auth_vars[n-1] == NULL)? US"" : auth_vars[n-1];
+  }
+
+/* For all other variables, search the table */
+
  while (last > first)
    {
    uschar *s, *domain;
@@ -1258,7 +1350,7 @@ while (last > first)
    if (c < 0) { last = middle; continue; }
  
    /* Found an existing variable. If in skipping state, the value isn't needed,
-  and we want to avoid processing (such as looking up up the host name). */
+  and we want to avoid processing (such as looking up the host name). */
  
    if (skipping) return US"";
  
@@ -1368,6 +1460,9 @@ while (last > first)
      case vtype_msgheaders:
      return find_header(NULL, exists_only, newsize, FALSE, NULL);
  
+    case vtype_msgheaders_raw:
+    return find_header(NULL, exists_only, newsize, TRUE, NULL);
+
      case vtype_msgbody:                        /* Pointer to msgbody string */
      case vtype_msgbody_end:                    /* Ditto, the end of the msg */
      ss = (uschar **)(var_table[middle].value);
@@ -1424,12 +1519,21 @@ while (last > first)
      return tod_stamp(tod_log_datestamp);
  
      case vtype_reply:                          /* Get reply address */
-    s = find_header(US"reply-to:", exists_only, newsize, FALSE,
+    s = find_header(US"reply-to:", exists_only, newsize, TRUE,
        headers_charset);
+    if (s != NULL) while (isspace(*s)) s++;
      if (s == NULL || *s == 0)
        {
        *newsize = 0;                            /* For the *s==0 case */
-      s = find_header(US"from:", exists_only, newsize, FALSE, headers_charset);
+      s = find_header(US"from:", exists_only, newsize, TRUE, headers_charset);
+      }
+    if (s != NULL)
+      {
+      uschar *t;
+      while (isspace(*s)) s++;
+      for (t = s; *t != 0; t++) if (*t == '\n') *t = ' ';
+      while (t > s && isspace(t[-1])) t--;
+      *t = 0;
        }
      return (s == NULL)? US"" : s;
  
@@ -1540,6 +1644,33 @@ return 0;
  
  
  
+/*************************************************
+*     Elaborate message for bad variable         *
+*************************************************/
+
+/* For the "unknown variable" message, take a look at the variable's name, and
+give additional information about possible ACL variables. The extra information
+is added on to expand_string_message.
+
+Argument:   the name of the variable
+Returns:    nothing
+*/
+
+static void
+check_variable_error_message(uschar *name)
+{
+if (Ustrncmp(name, "acl_", 4) == 0)
+  expand_string_message = string_sprintf("%s (%s)", expand_string_message,
+    (name[4] == 'c' || name[4] == 'm')?
+      (isalpha(name[5])?
+        US"6th character of a user-defined ACL variable must be a digit or underscore" :
+        US"strict_acl_vars is set"    /* Syntax is OK, it has to be this */
+      ) :
+      US"user-defined ACL variables must start acl_c or acl_m");
+}
+
+
+
  /*************************************************
  *        Read and evaluate a condition           *
  *************************************************/
@@ -1621,7 +1752,9 @@ switch(cond_type)
  
    s = read_name(name, 256, s+1, US"_");
  
-  /* Test for a header's existence */
+  /* Test for a header's existence. If the name contains a closing brace
+  character, this may be a user error where the terminating colon has been
+  omitted. Set a flag to adjust a subsequent error message in this case. */
  
    if (Ustrncmp(name, "h_", 2) == 0 ||
        Ustrncmp(name, "rh_", 3) == 0 ||
@@ -1631,6 +1764,7 @@ switch(cond_type)
        Ustrncmp(name, "bheader_", 8) == 0)
      {
      s = read_header_name(name, 256, s);
+    if (Ustrchr(name, '}') != NULL) malformed_header = TRUE;
      if (yield != NULL) *yield =
        (find_header(name, TRUE, NULL, FALSE, NULL) != NULL) == testfor;
      }
@@ -1646,6 +1780,7 @@ switch(cond_type)
        expand_string_message = (name[0] == 0)?
          string_sprintf("variable name omitted after \"def:\"") :
          string_sprintf("unknown variable \"%s\" after \"def:\"", name);
+      check_variable_error_message(name);
        return NULL;
        }
      if (yield != NULL) *yield = (value[0] != 0) == testfor;
@@ -1711,7 +1846,7 @@ switch(cond_type)
      case ECOND_ISIP4:
      case ECOND_ISIP6:
      rc = string_is_ip_address(sub[0], NULL);
-    *yield = ((cond_type == ECOND_ISIP)? (rc > 0) :
+    *yield = ((cond_type == ECOND_ISIP)? (rc != 0) :
               (cond_type == ECOND_ISIP4)? (rc == 4) : (rc == 6)) == testfor;
      break;
  
@@ -1856,26 +1991,18 @@ switch(cond_type)
      conditions that compare numbers do not start with a letter. This just saves
      checking for them individually. */
  
-    if (!isalpha(name[0]))
+    if (!isalpha(name[0]) && yield != NULL)
        {
-      uschar *endptr;
-      num[i] = (int)Ustrtol((const uschar *)sub[i], &endptr, 10);
-      if (tolower(*endptr) == 'k')
+      if (sub[i][0] == 0)
          {
-        num[i] *= 1024;
-        endptr++;
+        num[i] = 0;
+        DEBUG(D_expand)
+          debug_printf("empty string cast to zero for numerical comparison\n");
          }
-      else if (tolower(*endptr) == 'm')
-        {
-        num[i] *= 1024*1024;
-        endptr++;
-        }
-      while (isspace(*endptr)) endptr++;
-      if (*endptr != 0)
+      else
          {
-        expand_string_message = string_sprintf("\"%s\" is not a number",
-          sub[i]);
-        return NULL;
+        num[i] = expand_string_integer(sub[i], FALSE);
+        if (expand_string_message != NULL) return NULL;
          }
        }
      }
@@ -1971,7 +2098,7 @@ switch(cond_type)
      goto MATCHED_SOMETHING;
  
      case ECOND_MATCH_IP:       /* Match IP address in a host list */
-    if (sub[0][0] != 0 && string_is_ip_address(sub[0], NULL) <= 0)
+    if (sub[0][0] != 0 && string_is_ip_address(sub[0], NULL) == 0)
        {
        expand_string_message = string_sprintf("\"%s\" is not an IP address",
          sub[0]);
@@ -2533,8 +2660,8 @@ Returns:  pointer to string containing the last three
  static uschar *
  prvs_daystamp(int day_offset)
  {
-uschar *days = store_get(16);
-(void)string_format(days, 16, TIME_T_FMT,
+uschar *days = store_get(32);                /* Need at least 24 for cases */
+(void)string_format(days, 32, TIME_T_FMT,    /* where TIME_T_FMT is %lld */
    (time(NULL) + day_offset*86400)/86400);
  return (Ustrlen(days) >= 3) ? &days[Ustrlen(days)-3] : US"100";
  }
@@ -2664,63 +2791,53 @@ return yield;
  *          Evaluate numeric expression           *
  *************************************************/
  
-/* This is a set of mutually recursive functions that evaluate a simple
-arithmetic expression involving only + - * / and parentheses. The only one that
-is called from elsewhere is eval_expr, whose interface is:
+/* This is a set of mutually recursive functions that evaluate an arithmetic
+expression involving + - * / % & | ^ ~ << >> and parentheses. The only one of
+these functions that is called from elsewhere is eval_expr, whose interface is:
  
  Arguments:
-  sptr          pointer to the pointer to the string - gets updated
-  decimal       TRUE if numbers are to be assumed decimal
-  error         pointer to where to put an error message - must be NULL on input
-  endket        TRUE if ')' must terminate - FALSE for external call
+  sptr        pointer to the pointer to the string - gets updated
+  decimal     TRUE if numbers are to be assumed decimal
+  error       pointer to where to put an error message - must be NULL on input
+  endket      TRUE if ')' must terminate - FALSE for external call
  
-
-Returns:        on success: the value of the expression, with *error still NULL
-                on failure: an undefined value, with *error = a message
+Returns:      on success: the value of the expression, with *error still NULL
+              on failure: an undefined value, with *error = a message
  */
  
-static int eval_sumterm(uschar **, BOOL, uschar **);
+static int eval_op_or(uschar **, BOOL, uschar **);
+
  
  static int
  eval_expr(uschar **sptr, BOOL decimal, uschar **error, BOOL endket)
  {
  uschar *s = *sptr;
-int x = eval_sumterm(&s, decimal, error);
+int x = eval_op_or(&s, decimal, error);
  if (*error == NULL)
    {
-  while (*s == '+' || *s == '-')
+  if (endket)
      {
-    int op = *s++;
-    int y = eval_sumterm(&s, decimal, error);
-    if (*error != NULL) break;
-    if (op == '+') x += y; else x -= y;
-    }
-  if (*error == NULL)
-    {
-    if (endket)
-      {
-      if (*s != ')')
-        *error = US"expecting closing parenthesis";
-      else
-        while (isspace(*(++s)));
-      }
-    else if (*s != 0) *error = US"expecting + or -";
+    if (*s != ')')
+      *error = US"expecting closing parenthesis";
+    else
+      while (isspace(*(++s)));
      }
+  else if (*s != 0) *error = US"expecting operator";
    }
-
  *sptr = s;
  return x;
  }
  
+
  static int
-eval_term(uschar **sptr, BOOL decimal, uschar **error)
+eval_number(uschar **sptr, BOOL decimal, uschar **error)
  {
  register int c;
  int n;
  uschar *s = *sptr;
  while (isspace(*s)) s++;
  c = *s;
-if (isdigit(c) || ((c == '-' || c == '+') && isdigit(s[1])))
+if (isdigit(c))
    {
    int count;
    (void)sscanf(CS s, (decimal? "%d%n" : "%i%n"), &n, &count);
@@ -2743,16 +2860,38 @@ else
  return n;
  }
  
-static int eval_sumterm(uschar **sptr, BOOL decimal, uschar **error)
+
+static int eval_op_unary(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x;
+while (isspace(*s)) s++;
+if (*s == '+' || *s == '-' || *s == '~')
+  {
+  int op = *s++;
+  x = eval_op_unary(&s, decimal, error);
+  if (op == '-') x = -x;
+    else if (op == '~') x = ~x;
+  }
+else
+  {
+  x = eval_number(&s, decimal, error);
+  }
+*sptr = s;
+return x;
+}
+
+
+static int eval_op_mult(uschar **sptr, BOOL decimal, uschar **error)
  {
  uschar *s = *sptr;
-int x = eval_term(&s, decimal, error);
+int x = eval_op_unary(&s, decimal, error);
  if (*error == NULL)
    {
    while (*s == '*' || *s == '/' || *s == '%')
      {
      int op = *s++;
-    int y = eval_term(&s, decimal, error);
+    int y = eval_op_unary(&s, decimal, error);
      if (*error != NULL) break;
      if (op == '*') x *= y;
        else if (op == '/') x /= y;
@@ -2764,6 +2903,105 @@ return x;
  }
  
  
+static int eval_op_sum(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x = eval_op_mult(&s, decimal, error);
+if (*error == NULL)
+  {
+  while (*s == '+' || *s == '-')
+    {
+    int op = *s++;
+    int y = eval_op_mult(&s, decimal, error);
+    if (*error != NULL) break;
+    if (op == '+') x += y; else x -= y;
+    }
+  }
+*sptr = s;
+return x;
+}
+
+
+static int eval_op_shift(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x = eval_op_sum(&s, decimal, error);
+if (*error == NULL)
+  {
+  while ((*s == '<' || *s == '>') && s[1] == s[0])
+    {
+    int y;
+    int op = *s++;
+    s++;
+    y = eval_op_sum(&s, decimal, error);
+    if (*error != NULL) break;
+    if (op == '<') x <<= y; else x >>= y;
+    }
+  }
+*sptr = s;
+return x;
+}
+
+
+static int eval_op_and(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x = eval_op_shift(&s, decimal, error);
+if (*error == NULL)
+  {
+  while (*s == '&')
+    {
+    int y;
+    s++;
+    y = eval_op_shift(&s, decimal, error);
+    if (*error != NULL) break;
+    x &= y;
+    }
+  }
+*sptr = s;
+return x;
+}
+
+
+static int eval_op_xor(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x = eval_op_and(&s, decimal, error);
+if (*error == NULL)
+  {
+  while (*s == '^')
+    {
+    int y;
+    s++;
+    y = eval_op_and(&s, decimal, error);
+    if (*error != NULL) break;
+    x ^= y;
+    }
+  }
+*sptr = s;
+return x;
+}
+
+
+static int eval_op_or(uschar **sptr, BOOL decimal, uschar **error)
+{
+uschar *s = *sptr;
+int x = eval_op_xor(&s, decimal, error);
+if (*error == NULL)
+  {
+  while (*s == '|')
+    {
+    int y;
+    s++;
+    y = eval_op_xor(&s, decimal, error);
+    if (*error != NULL) break;
+    x |= y;
+    }
+  }
+*sptr = s;
+return x;
+}
+
  
  
  /*************************************************
@@ -2921,7 +3159,7 @@ while (*s != 0)
        value = find_header(name, FALSE, &newsize, want_raw, charset);
  
        /* If we didn't find the header, and the header contains a closing brace
-      characters, this may be a user error where the terminating colon
+      character, this may be a user error where the terminating colon
        has been omitted. Set a flag to adjust the error message in this case.
        But there is no error here - nothing gets inserted. */
  
@@ -2941,6 +3179,7 @@ while (*s != 0)
          {
          expand_string_message =
            string_sprintf("unknown variable name \"%s\"", name);
+          check_variable_error_message(name);
          goto EXPAND_FAILED;
          }
        }
@@ -3359,15 +3598,24 @@ while (*s != 0)
        domain = Ustrrchr(sub_arg[0],'@');
        if ( (domain == NULL) || (domain == sub_arg[0]) || (Ustrlen(domain) == 1) )
          {
-        expand_string_message = US"first parameter must be a qualified email address";
+        expand_string_message = US"prvs first argument must be a qualified email address";
+        goto EXPAND_FAILED;
+        }
+
+      /* Calculate the hash. The second argument must be a single-digit
+      key number, or unset. */
+
+      if (sub_arg[2] != NULL &&
+          (!isdigit(sub_arg[2][0]) || sub_arg[2][1] != 0))
+        {
+        expand_string_message = US"prvs second argument must be a single digit";
          goto EXPAND_FAILED;
          }
  
-      /* Calculate the hash */
        p = prvs_hmac_sha1(sub_arg[0],sub_arg[1],sub_arg[2],prvs_daystamp(7));
        if (p == NULL)
          {
-        expand_string_message = US"hmac-sha1 conversion failed";
+        expand_string_message = US"prvs hmac-sha1 conversion failed";
          goto EXPAND_FAILED;
          }
  
@@ -3394,18 +3642,23 @@ while (*s != 0)
        int mysize = 0, myptr = 0;
        const pcre *re;
        uschar *p;
-      /* Ugliness: We want to expand parameter 1 first, then set
+
+      /* TF: Ugliness: We want to expand parameter 1 first, then set
           up expansion variables that are used in the expansion of
           parameter 2. So we clone the string for the first
-         expansion, where we only expand paramter 1. */
-      uschar *s_backup = string_copy(s);
+         expansion, where we only expand parameter 1.
+
+         PH: Actually, that isn't necessary. The read_subs() function is
+         designed to work this way for the ${if and ${lookup expansions. I've
+         tidied the code.
+      */
  
        /* Reset expansion variables */
        prvscheck_result = NULL;
        prvscheck_address = NULL;
        prvscheck_keynum = NULL;
  
-      switch(read_subs(sub_arg, 1, 1, &s_backup, skipping, FALSE, US"prvs"))
+      switch(read_subs(sub_arg, 1, 1, &s, skipping, FALSE, US"prvs"))
          {
          case 1: goto EXPAND_FAILED_CURLY;
          case 2:
@@ -3415,7 +3668,8 @@ while (*s != 0)
        re = regex_must_compile(US"^prvs\\=(.+)\\/([0-9])([0-9]{3})([A-F0-9]{6})\\@(.+)$",
                                TRUE,FALSE);
  
-      if (regex_match_and_setup(re,sub_arg[0],0,-1)) {
+      if (regex_match_and_setup(re,sub_arg[0],0,-1))
+        {
          uschar *local_part = string_copyn(expand_nstring[1],expand_nlength[1]);
          uschar *key_num = string_copyn(expand_nstring[2],expand_nlength[2]);
          uschar *daystamp = string_copyn(expand_nstring[3],expand_nlength[3]);
@@ -3435,21 +3689,19 @@ while (*s != 0)
          prvscheck_address[myptr] = '\0';
          prvscheck_keynum = string_copy(key_num);
  
-        /* Now re-expand all arguments in the usual manner */
-        switch(read_subs(sub_arg, 3, 3, &s, skipping, TRUE, US"prvs"))
+        /* Now expand the second argument */
+        switch(read_subs(sub_arg, 1, 1, &s, skipping, FALSE, US"prvs"))
            {
            case 1: goto EXPAND_FAILED_CURLY;
            case 2:
            case 3: goto EXPAND_FAILED;
            }
  
-        if (*sub_arg[2] == '\0')
-          yield = string_cat(yield,&size,&ptr,prvscheck_address,Ustrlen(prvscheck_address));
-        else
-          yield = string_cat(yield,&size,&ptr,sub_arg[2],Ustrlen(sub_arg[2]));
-
          /* Now we have the key and can check the address. */
-        p = prvs_hmac_sha1(prvscheck_address, sub_arg[1], prvscheck_keynum, daystamp);
+
+        p = prvs_hmac_sha1(prvscheck_address, sub_arg[0], prvscheck_keynum,
+          daystamp);
+
          if (p == NULL)
            {
            expand_string_message = US"hmac-sha1 conversion failed";
@@ -3458,6 +3710,7 @@ while (*s != 0)
  
          DEBUG(D_expand) debug_printf("prvscheck: received hash is %s\n", hash);
          DEBUG(D_expand) debug_printf("prvscheck:      own hash is %s\n", p);
+
          if (Ustrcmp(p,hash) == 0)
            {
            /* Success, valid BATV address. Now check the expiry date. */
@@ -3487,12 +3740,35 @@ while (*s != 0)
            prvscheck_result = NULL;
            DEBUG(D_expand) debug_printf("prvscheck: hash failure, $pvrs_result unset\n");
            }
-      }
+
+        /* Now expand the final argument. We leave this till now so that
+        it can include $prvscheck_result. */
+
+        switch(read_subs(sub_arg, 1, 0, &s, skipping, TRUE, US"prvs"))
+          {
+          case 1: goto EXPAND_FAILED_CURLY;
+          case 2:
+          case 3: goto EXPAND_FAILED;
+          }
+
+        if (sub_arg[0] == NULL || *sub_arg[0] == '\0')
+          yield = string_cat(yield,&size,&ptr,prvscheck_address,Ustrlen(prvscheck_address));
+        else
+          yield = string_cat(yield,&size,&ptr,sub_arg[0],Ustrlen(sub_arg[0]));
+
+        /* Reset the "internal" variables afterwards, because they are in
+        dynamic store that will be reclaimed if the expansion succeeded. */
+
+        prvscheck_address = NULL;
+        prvscheck_keynum = NULL;
+        }
        else
          {
          /* Does not look like a prvs encoded address, return the empty string.
-           We need to make sure all subs are expanded first. */
-        switch(read_subs(sub_arg, 3, 3, &s, skipping, TRUE, US"prvs"))
+           We need to make sure all subs are expanded first, so as to skip over
+           the entire item. */
+
+        switch(read_subs(sub_arg, 2, 1, &s, skipping, TRUE, US"prvs"))
            {
            case 1: goto EXPAND_FAILED_CURLY;
            case 2:
@@ -3583,28 +3859,160 @@ while (*s != 0)
          }
        else sub_arg[3] = NULL;                     /* No eol if no timeout */
  
-      /* If skipping, we don't actually do anything */
+      /* If skipping, we don't actually do anything. Otherwise, arrange to
+      connect to either an IP or a Unix socket. */
  
        if (!skipping)
          {
-        /* Make a connection to the socket */
+        /* Handle an IP (internet) domain */
  
-        if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) == -1)
+        if (Ustrncmp(sub_arg[0], "inet:", 5) == 0)
            {
-          expand_string_message = string_sprintf("failed to create socket: %s",
-            strerror(errno));
-          goto SOCK_FAIL;
+          BOOL connected = FALSE;
+          int namelen, port;
+          host_item shost;
+          host_item *h;
+          uschar *server_name = sub_arg[0] + 5;
+          uschar *port_name = Ustrrchr(server_name, ':');
+
+          /* Sort out the port */
+
+          if (port_name == NULL)
+            {
+            expand_string_message =
+              string_sprintf("missing port for readsocket %s", sub_arg[0]);
+            goto EXPAND_FAILED;
+            }
+          *port_name++ = 0;           /* Terminate server name */
+
+          if (isdigit(*port_name))
+            {
+            uschar *end;
+            port = Ustrtol(port_name, &end, 0);
+            if (end != port_name + Ustrlen(port_name))
+              {
+              expand_string_message =
+                string_sprintf("invalid port number %s", port_name);
+              goto EXPAND_FAILED;
+              }
+            }
+          else
+            {
+            struct servent *service_info = getservbyname(CS port_name, "tcp");
+            if (service_info == NULL)
+              {
+              expand_string_message = string_sprintf("unknown port \"%s\"",
+                port_name);
+              goto EXPAND_FAILED;
+              }
+            port = ntohs(service_info->s_port);
+            }
+
+          /* Sort out the server. */
+
+          shost.next = NULL;
+          shost.address = NULL;
+          shost.port = port;
+          shost.mx = -1;
+
+          namelen = Ustrlen(server_name);
+
+          /* Anything enclosed in [] must be an IP address. */
+
+          if (server_name[0] == '[' &&
+              server_name[namelen - 1] == ']')
+            {
+            server_name[namelen - 1] = 0;
+            server_name++;
+            if (string_is_ip_address(server_name, NULL) == 0)
+              {
+              expand_string_message =
+                string_sprintf("malformed IP address \"%s\"", server_name);
+              goto EXPAND_FAILED;
+              }
+            shost.name = shost.address = server_name;
+            }
+
+          /* Otherwise check for an unadorned IP address */
+
+          else if (string_is_ip_address(server_name, NULL) != 0)
+            shost.name = shost.address = server_name;
+
+          /* Otherwise lookup IP address(es) from the name */
+
+          else
+            {
+            shost.name = server_name;
+            if (host_find_byname(&shost, NULL, HOST_FIND_QUALIFY_SINGLE, NULL,
+                FALSE) != HOST_FOUND)
+              {
+              expand_string_message =
+                string_sprintf("no IP address found for host %s", shost.name);
+              goto EXPAND_FAILED;
+              }
+            }
+
+          /* Try to connect to the server - test each IP till one works */
+
+          for (h = &shost; h != NULL; h = h->next)
+            {
+            int af = (Ustrchr(h->address, ':') != 0)? AF_INET6 : AF_INET;
+            if ((fd = ip_socket(SOCK_STREAM, af)) == -1)
+              {
+              expand_string_message = string_sprintf("failed to create socket: "
+                "%s", strerror(errno));
+              goto SOCK_FAIL;
+              }
+
+            if (ip_connect(fd, af, h->address, port, timeout) == 0)
+              {
+              connected = TRUE;
+              break;
+              }
+            }
+
+          if (!connected)
+            {
+            expand_string_message = string_sprintf("failed to connect to "
+              "socket %s: couldn't connect to any host", sub_arg[0],
+              strerror(errno));
+            goto SOCK_FAIL;
+            }
            }
  
-        sockun.sun_family = AF_UNIX;
-        sprintf(sockun.sun_path, "%.*s", (int)(sizeof(sockun.sun_path)-1),
-          sub_arg[0]);
-        if(connect(fd, (struct sockaddr *)(&sockun), sizeof(sockun)) == -1)
+        /* Handle a Unix domain socket */
+
+        else
            {
-          expand_string_message = string_sprintf("failed to connect to socket "
-            "%s: %s", sub_arg[0], strerror(errno));
-          goto SOCK_FAIL;
+          int rc;
+          if ((fd = socket(PF_UNIX, SOCK_STREAM, 0)) == -1)
+            {
+            expand_string_message = string_sprintf("failed to create socket: %s",
+              strerror(errno));
+            goto SOCK_FAIL;
+            }
+
+          sockun.sun_family = AF_UNIX;
+          sprintf(sockun.sun_path, "%.*s", (int)(sizeof(sockun.sun_path)-1),
+            sub_arg[0]);
+
+          sigalrm_seen = FALSE;
+          alarm(timeout);
+          rc = connect(fd, (struct sockaddr *)(&sockun), sizeof(sockun));
+          alarm(0);
+          if (sigalrm_seen)
+            {
+            expand_string_message = US "socket connect timed out";
+            goto SOCK_FAIL;
+            }
+          if (rc < 0)
+            {
+            expand_string_message = string_sprintf("failed to connect to socket "
+              "%s: %s", sub_arg[0], strerror(errno));
+            goto SOCK_FAIL;
+            }
            }
+
          DEBUG(D_expand) debug_printf("connected to socket %s\n", sub_arg[0]);
  
          /* Write the request string, if not empty */
@@ -3622,6 +4030,14 @@ while (*s != 0)
              }
            }
  
+        /* Shut down the sending side of the socket. This helps some servers to
+        recognise that it is their turn to do some work. Just in case some
+        system doesn't have this function, make it conditional. */
+
+        #ifdef SHUT_WR
+        shutdown(fd, SHUT_WR);
+        #endif
+
          /* Now we need to read from the socket, under a timeout. The function
          that reads a file can be used. */
  
@@ -3638,7 +4054,7 @@ while (*s != 0)
          if (sigalrm_seen)
            {
            ptr = save_ptr;
-          expand_string_message = US"socket read timed out";
+          expand_string_message = US "socket read timed out";
            goto SOCK_FAIL;
            }
          }
@@ -4357,6 +4773,8 @@ while (*s != 0)
          continue;
          }
  
+      /* Note that for Darwin and Cygwin, BASE_62 actually has the value 36 */
+
        case EOP_BASE62D:
          {
          uschar buf[16];
@@ -4368,10 +4786,11 @@ while (*s != 0)
            if (t == NULL)
              {
              expand_string_message = string_sprintf("argument for base62d "
-              "operator is \"%s\", which is not a base 62 number", sub);
+              "operator is \"%s\", which is not a base %d number", sub,
+              BASE_62);
              goto EXPAND_FAILED;
              }
-          n = n * 62 + (t - base62_chars);
+          n = n * BASE_62 + (t - base62_chars);
            }
          (void)sprintf(CS buf, "%ld", n);
          yield = string_cat(yield, &size, &ptr, buf, Ustrlen(buf));
@@ -4662,11 +5081,28 @@ while (*s != 0)
          {
          uschar buffer[2048];
          uschar *string = parse_quote_2047(sub, Ustrlen(sub), headers_charset,
-          buffer, sizeof(buffer));
+          buffer, sizeof(buffer), FALSE);
          yield = string_cat(yield, &size, &ptr, string, Ustrlen(string));
          continue;
          }
  
+      /* RFC 2047 decode */
+
+      case EOP_RFC2047D:
+        {
+        int len;
+        uschar *error;
+        uschar *decoded = rfc2047_decode(sub, check_rfc2047_length,
+          headers_charset, '?', &len, &error);
+        if (error != NULL)
+          {
+          expand_string_message = error;
+          goto EXPAND_FAILED;
+          }
+        yield = string_cat(yield, &size, &ptr, decoded, len);
+        continue;
+        }
+
        /* from_utf8 converts UTF-8 to 8859-1, turning non-existent chars into
        underscores */
  
@@ -4715,6 +5151,20 @@ while (*s != 0)
  
        /* Handle time period formating */
  
+      case EOP_TIME_EVAL:
+        {
+        int n = readconf_readtime(sub, 0, FALSE);
+        if (n < 0)
+          {
+          expand_string_message = string_sprintf("string \"%s\" is not an "
+            "Exim time interval in \"%s\" operator", sub, name);
+          goto EXPAND_FAILED;
+          }
+        sprintf(CS var_buffer, "%d", n);
+        yield = string_cat(yield, &size, &ptr, var_buffer, Ustrlen(var_buffer));
+        continue;
+        }
+
        case EOP_TIME_INTERVAL:
          {
          int n;
@@ -4926,6 +5376,7 @@ while (*s != 0)
        {
        expand_string_message =
          string_sprintf("unknown variable in \"${%s}\"", name);
+      check_variable_error_message(name);
        goto EXPAND_FAILED;
        }
      len = Ustrlen(value);
@@ -5051,22 +5502,26 @@ return yield;
  
  /* Expand a string, and convert the result into an integer.
  
-Argument: the string to be expanded
+Arguments:
+  string  the string to be expanded
+  isplus  TRUE if a non-negative number is expected
  
  Returns:  the integer value, or
            -1 for an expansion error               ) in both cases, message in
            -2 for an integer interpretation error  ) expand_string_message
-
+          expand_string_message is set NULL for an OK integer
  */
  
  int
-expand_string_integer(uschar *string)
+expand_string_integer(uschar *string, BOOL isplus)
  {
  long int value;
  uschar *s = expand_string(string);
  uschar *msg = US"invalid integer \"%s\"";
  uschar *endptr;
  
+/* If expansion failed, expand_string_message will be set. */
+
  if (s == NULL) return -1;
  
  /* On an overflow, strtol() returns LONG_MAX or LONG_MIN, and sets errno
@@ -5074,12 +5529,17 @@ to ERANGE. When there isn't an overflow, errno is not changed, at least on some
  systems, so we set it zero ourselves. */
  
  errno = 0;
-value = strtol(CS s, CSS &endptr, 0);
+expand_string_message = NULL;               /* Indicates no error */
+value = strtol(CS s, CSS &endptr, 10);
  
  if (endptr == s)
    {
    msg = US"integer expected but \"%s\" found";
    }
+else if (value < 0 && isplus)
+  {
+  msg = US"non-negative integer expected but \"%s\" found";
+  }
  else
    {
    /* Ensure we can cast this down to an int */