Fix validation of domain-literals in Message-ID: headers. Bug 2805

[exim.git] / src / src / parse.c
diff --git a/src/src/parse.c b/src/src/parse.c

index e0470c86f51236265d9ba67b671e420c34b77112..42f1234be8b396b3e6f3450b2be416cf431ec72f 100644 (file)
--- a/src/src/parse.c
+++ b/src/src/parse.c
@@ -65,7 +65,7 @@ Returns:   pointer past the end of the address
  */
  
  uschar *
-parse_find_address_end(uschar *s, BOOL nl_ends)
+parse_find_address_end(const uschar *s, BOOL nl_ends)
  {
  BOOL source_routing = *s == '@';
  int no_term = source_routing? 1 : 0;
@@ -121,7 +121,7 @@ while (*s != 0 && (*s != ',' || no_term > 0) && (*s != '\n' || !nl_ends))
      }
    }
  
-return s;
+return US s;
  }
  
  
@@ -224,16 +224,20 @@ If allow_domain_literals is TRUE, a "domain" may also be an IP address enclosed
  in []. Make sure the output is set to the null string if there is a syntax
  error as well as if there is no domain at all.
  
+Optionally, msg_id domain literals (visible ASCII characters other than
+'[', '\' and ']', enclosed in []) are permitted.
+
  Arguments:
    s          current character pointer
    t          where to put the domain
+  msg_id_literals     flag for relaxed domain-literal processing
    errorptr   put error message here on failure (*t will be 0 on exit)
  
  Returns:     new character pointer
  */
  
  static const uschar *
-read_domain(const uschar *s, uschar *t, uschar **errorptr)
+read_domain(const uschar *s, uschar *t, BOOL msg_id_literals, uschar **errorptr)
  {
  uschar *tt = t;
  s = skip_comment(s);
@@ -259,7 +263,11 @@ if (*s == '[')
      t += 5;
      s += 5;
      }
-  while (*s == '.' || *s == ':' || isxdigit(*s)) *t++ = *s++;
+
+  if (msg_id_literals)
+    while (*s >= 33 && *s <= 90 || *s >= 94 && *s <= 126) *t++ = *s++;
+  else
+    while (*s == '.' || *s == ':' || isxdigit(*s)) *t++ = *s++;
  
    if (*s == ']') *t++ = *s++; else
      {
@@ -267,7 +275,7 @@ if (*s == '[')
      *tt = 0;
      }
  
-  if (!allow_domain_literals)
+  if (!allow_domain_literals && !msg_id_literals)
      {
      *errorptr = US"domain literals not allowed";
      *tt = 0;
@@ -500,7 +508,7 @@ BOOL commas = FALSE;
  while (*s == '@')
    {
    *t++ = '@';
-  s = read_domain(s+1, t, errorptr);
+  s = read_domain(s+1, t, FALSE, errorptr);
    if (*t == 0) return s;
    t += Ustrlen((const uschar *)t);
    if (*s != ',') break;
@@ -559,7 +567,7 @@ if (*errorptr == NULL)
        t += Ustrlen((const uschar *)t);
        *t++ = *s++;
        *domainptr = t;
-      s = read_domain(s, t, errorptr);
+      s = read_domain(s, t, FALSE, errorptr);
        }
  return s;
  }
@@ -649,7 +657,7 @@ if (*s != '@' && *s != '<')
    {
    if (*s == 0 || *s == ';')
      {
-    if (*t == 0) FAILED(US"empty address");
+    if (!*t) FAILED(US"empty address");
      endptr = last_comment_position;
      goto PARSE_SUCCEEDED;              /* Bare local part */
      }
@@ -740,7 +748,7 @@ if (*s == '<')
      }
  
    endptr = s;
-  if (*errorptr != NULL) goto PARSE_FAILED;
+  if (*errorptr) goto PARSE_FAILED;
    while (bracket_count-- > 0) if (*s++ != '>')
      {
      *errorptr = s[-1] == 0
@@ -759,14 +767,14 @@ should be the domain. However, for flexibility we allow for a route-address
  not enclosed in <> as well, which is indicated by an empty first local
  part preceding '@'. The source routing is, however, ignored. */
  
-else if (*t == 0)
+else if (!*t)
    {
    uschar *domainptr = yield;
    s = read_route(s, t, errorptr);
-  if (*errorptr != NULL) goto PARSE_FAILED;
+  if (*errorptr) goto PARSE_FAILED;
    *t = 0;         /* Ensure route is ignored - probably overkill */
    s = read_addr_spec(s, t, 0, errorptr, &domainptr);
-  if (*errorptr != NULL) goto PARSE_FAILED;
+  if (*errorptr) goto PARSE_FAILED;
    *domain = domainptr - yield;
    endptr = last_comment_position;
    if (*domain == 0) FAILED(US"domain missing in source-routed address");
@@ -779,8 +787,8 @@ else
    t += Ustrlen((const uschar *)t);
    *t++ = *s++;
    *domain = t - yield;
-  s = read_domain(s, t, errorptr);
-  if (*t == 0) goto PARSE_FAILED;
+  s = read_domain(s, t, TRUE, errorptr);
+  if (!*t) goto PARSE_FAILED;
    endptr = last_comment_position;
    }
  
@@ -789,7 +797,7 @@ through for other cases. Endptr may have been moved over whitespace, so
  move it back past white space if necessary. */
  
  PARSE_SUCCEEDED:
-if (*s != 0)
+if (*s)
    {
    if (f.parse_found_group && *s == ';')
      {
@@ -984,12 +992,12 @@ if (i < len)
  
  /* No non-printers; use the RFC 822 quoting rules */
  
-if (!len)
+if (len <= 0 || len >= INT_MAX/4)
    {
-  return string_copy_taint(US"", is_tainted(phrase));
+  return string_copy_taint(CUS"", is_tainted(phrase));
    }
  
-buffer = store_get(len*4, is_tainted(phrase));
+buffer = store_get((len+1)*4, is_tainted(phrase));
  
  s = phrase;
  end = s + len;
@@ -1233,7 +1241,7 @@ Returns:      FF_DELIVERED      addresses extracted
  */
  
  int
-parse_forward_list(uschar *s, int options, address_item **anchor,
+parse_forward_list(const uschar *s, int options, address_item **anchor,
    uschar **error, const uschar *incoming_domain, uschar *directory,
    error_block **syntax_errors)
  {
@@ -1247,7 +1255,7 @@ for (;;)
    int special = 0;
    int specopt = 0;
    int specbit = 0;
-  uschar *ss, *nexts;
+  const uschar *ss, *nexts;
    address_item *addr;
    BOOL inquote = FALSE;
  
@@ -1275,7 +1283,7 @@ for (;;)
      syntax error has been skipped. I now think it is the wrong approach, but
      have left this here just in case, and for the record. */
  
-    #ifdef NEVER
+#ifdef NEVER
      if (count > 0) return FF_DELIVERED;   /* Something was generated */
  
      if (syntax_errors == NULL ||          /* Not skipping syntax errors, or */
@@ -1285,8 +1293,7 @@ for (;;)
      *error = string_sprintf("no addresses generated: syntax error in %s: %s",
         (*syntax_errors)->text2, (*syntax_errors)->text1);
      return FF_ERROR;
-    #endif
-
+#endif
      }
  
    /* Find the end of the next address. Quoted strings in addresses may contain
@@ -1323,13 +1330,7 @@ for (;;)
  
    len = ss - s;
  
-  DEBUG(D_route)
-    {
-    int save = s[len];
-    s[len] = 0;
-    debug_printf("extract item: %s\n", s);
-    s[len] = save;
-    }
+  DEBUG(D_route) debug_printf("extract item: %.*s\n", len, s);
  
    /* Handle special addresses if permitted. If the address is :unknown:
    ignore it - this is for backward compatibility with old alias files. You
@@ -1350,7 +1351,7 @@ for (;;)
    else if (Ustrncmp(s, ":fail:", 6) == 0)
      { special = FF_FAIL; specopt = RDO_FAIL; }  /* specbit is 0 */
  
-  if (special != 0)
+  if (special)
      {
      uschar *ss = Ustrchr(s+1, ':') + 1;
      if ((options & specopt) == specbit)
@@ -1358,10 +1359,9 @@ for (;;)
        *error = string_sprintf("\"%.*s\" is not permitted", len, s);
        return FF_ERROR;
        }
-    while (*ss != 0 && isspace(*ss)) ss++;
-    while (s[len] != 0 && s[len] != '\n') len++;
-    s[len] = 0;
-    *error = string_copy(ss);
+    while (*ss && isspace(*ss)) ss++;
+    while (s[len] && s[len] != '\n') len++;
+    *error = string_copyn(ss, s + len - ss);
      return special;
      }
  
@@ -1374,7 +1374,7 @@ for (;;)
      {
      uschar *filebuf;
      uschar filename[256];
-    uschar *t = s+9;
+    const uschar * t = s+9;
      int flen = len - 9;
      int frc;
      struct stat statbuf;
@@ -1415,12 +1415,8 @@ for (;;)
        return FF_ERROR;
        }
  
-    if (is_tainted(filename))
-      {
-      *error = string_sprintf("Tainted name '%s' for included file  not permitted\n",
-       filename);
+    if ((*error = is_tainted2(filename, 0, "Tainted name '%s' for included file not permitted\n", filename)))
        return FF_ERROR;
-      }
  
      /* Check file name if required */
  
@@ -1591,18 +1587,17 @@ for (;;)
      {
      int start, end, domain;
      const uschar *recipient = NULL;
-    int save = s[len];
-    s[len] = 0;
+    uschar * s_ltd = string_copyn(s, len);
  
      /* If it starts with \ and the rest of it parses as a valid mail address
      without a domain, carry on with that address, but qualify it with the
      incoming domain. Otherwise arrange for the address to fall through,
      causing an error message on the re-parse. */
  
-    if (*s == '\\')
+    if (*s_ltd == '\\')
        {
        recipient =
-        parse_extract_address(s+1, error, &start, &end, &domain, FALSE);
+        parse_extract_address(s_ltd+1, error, &start, &end, &domain, FALSE);
        if (recipient)
          recipient = domain != 0 ? NULL :
            string_sprintf("%s@%s", recipient, incoming_domain);
@@ -1611,17 +1606,17 @@ for (;;)
      /* Try parsing the item as an address. */
  
      if (!recipient) recipient =
-      parse_extract_address(s, error, &start, &end, &domain, FALSE);
+      parse_extract_address(s_ltd, error, &start, &end, &domain, FALSE);
  
      /* If item starts with / or | and is not a valid address, or there
      is no domain, treat it as a file or pipe. If it was a quoted item,
      remove the quoting occurrences of \ within it. */
  
-    if ((*s == '|' || *s == '/') && (recipient == NULL || domain == 0))
+    if ((*s_ltd == '|' || *s_ltd == '/') && (recipient == NULL || domain == 0))
        {
-      uschar *t = store_get(Ustrlen(s) + 1, is_tainted(s));
+      uschar *t = store_get(Ustrlen(s_ltd) + 1, is_tainted(s_ltd));
        uschar *p = t;
-      uschar *q = s;
+      uschar *q = s_ltd;
        while (*q != 0)
          {
          if (inquote)
@@ -1634,7 +1629,7 @@ for (;;)
        *p = 0;
        addr = deliver_make_addr(t, TRUE);
        setflag(addr, af_pfr);                   /* indicates pipe/file/reply */
-      if (*s != '|') setflag(addr, af_file);   /* indicates file */
+      if (*s_ltd != '|') setflag(addr, af_file);   /* indicates file */
        }
  
      /* Item must be an address. Complain if not, else qualify, rewrite and set
@@ -1646,36 +1641,33 @@ for (;;)
  
      else
        {
-      if (recipient == NULL)
+      if (!recipient)
          {
          if (Ustrcmp(*error, "empty address") == 0)
            {
            *error = NULL;
-          s[len] = save;
            s = nexts;
            continue;
            }
  
-        if (syntax_errors != NULL)
+        if (syntax_errors)
            {
            error_block *e = store_get(sizeof(error_block), FALSE);
            error_block *last = *syntax_errors;
-          if (last == NULL) *syntax_errors = e; else
+          if (!last) *syntax_errors = e; else
              {
-            while (last->next != NULL) last = last->next;
+            while (last->next) last = last->next;
              last->next = e;
              }
            e->next = NULL;
            e->text1 = *error;
-          e->text2 = string_copy(s);
-          s[len] = save;
+          e->text2 = s_ltd;
            s = nexts;
            continue;
            }
          else
            {
-          *error = string_sprintf("%s in \"%s\"", *error, s);
-          s[len] = save;   /* _after_ using it for *error */
+          *error = string_sprintf("%s in \"%s\"", *error, s_ltd);
            return FF_ERROR;
            }
          }
@@ -1690,10 +1682,8 @@ for (;;)
        addr = deliver_make_addr(US recipient, TRUE);  /* TRUE => copy recipient, so deconst ok */
        }
  
-    /* Restore the final character in the original data, and add to the
-    output chain. */
+    /* Add the new address to the output chain. */
  
-    s[len] = save;
      addr->next = *anchor;
      *anchor = addr;
      count++;