src/src/verify.c

   1 /*************************************************
   2 *     Exim - an Internet mail transport agent    *
   3 *************************************************/
   4
   5 /* Copyright (c) University of Cambridge 1995 - 2017 */
   6 /* See the file NOTICE for conditions of use and distribution. */
   7
   8 /* Functions concerned with verifying things. The original code for callout
   9 caching was contributed by Kevin Fleming (but I hacked it around a bit). */
  10
  11
  12 #include "exim.h"
  13 #include "transports/smtp.h"
  14
  15 #define CUTTHROUGH_CMD_TIMEOUT  30      /* timeout for cutthrough-routing calls */
  16 #define CUTTHROUGH_DATA_TIMEOUT 60      /* timeout for cutthrough-routing calls */
  17 static smtp_outblock ctblock;
  18 uschar ctbuffer[8192];
  19
  20
  21 /* Structure for caching DNSBL lookups */
  22
  23 typedef struct dnsbl_cache_block {
  24   time_t expiry;
  25   dns_address *rhs;
  26   uschar *text;
  27   int rc;
  28   BOOL text_set;
  29 } dnsbl_cache_block;
  30
  31
  32 /* Anchor for DNSBL cache */
  33
  34 static tree_node *dnsbl_cache = NULL;
  35
  36
  37 /* Bits for match_type in one_check_dnsbl() */
  38
  39 #define MT_NOT 1
  40 #define MT_ALL 2
  41
  42 static uschar cutthrough_response(int, char, uschar **, int);
  43
  44
  45
  46 /*************************************************
  47 *          Retrieve a callout cache record       *
  48 *************************************************/
  49
  50 /* If a record exists, check whether it has expired.
  51
  52 Arguments:
  53   dbm_file          an open hints file
  54   key               the record key
  55   type              "address" or "domain"
  56   positive_expire   expire time for positive records
  57   negative_expire   expire time for negative records
  58
  59 Returns:            the cache record if a non-expired one exists, else NULL
  60 */
  61
  62 static dbdata_callout_cache *
  63 get_callout_cache_record(open_db *dbm_file, const uschar *key, uschar *type,
  64   int positive_expire, int negative_expire)
  65 {
  66 BOOL negative;
  67 int length, expire;
  68 time_t now;
  69 dbdata_callout_cache *cache_record;
  70
  71 cache_record = dbfn_read_with_length(dbm_file, key, &length);
  72
  73 if (cache_record == NULL)
  74   {
  75   HDEBUG(D_verify) debug_printf("callout cache: no %s record found for %s\n", type, key);
  76   return NULL;
  77   }
  78
  79 /* We treat a record as "negative" if its result field is not positive, or if
  80 it is a domain record and the postmaster field is negative. */
  81
  82 negative = cache_record->result != ccache_accept ||
  83   (type[0] == 'd' && cache_record->postmaster_result == ccache_reject);
  84 expire = negative? negative_expire : positive_expire;
  85 now = time(NULL);
  86
  87 if (now - cache_record->time_stamp > expire)
  88   {
  89   HDEBUG(D_verify) debug_printf("callout cache: %s record expired for %s\n", type, key);
  90   return NULL;
  91   }
  92
  93 /* If this is a non-reject domain record, check for the obsolete format version
  94 that doesn't have the postmaster and random timestamps, by looking at the
  95 length. If so, copy it to a new-style block, replicating the record's
  96 timestamp. Then check the additional timestamps. (There's no point wasting
  97 effort if connections are rejected.) */
  98
  99 if (type[0] == 'd' && cache_record->result != ccache_reject)
 100   {
 101   if (length == sizeof(dbdata_callout_cache_obs))
 102     {
 103     dbdata_callout_cache *new = store_get(sizeof(dbdata_callout_cache));
 104     memcpy(new, cache_record, length);
 105     new->postmaster_stamp = new->random_stamp = new->time_stamp;
 106     cache_record = new;
 107     }
 108
 109   if (now - cache_record->postmaster_stamp > expire)
 110     cache_record->postmaster_result = ccache_unknown;
 111
 112   if (now - cache_record->random_stamp > expire)
 113     cache_record->random_result = ccache_unknown;
 114   }
 115
 116 HDEBUG(D_verify) debug_printf("callout cache: found %s record for %s\n", type, key);
 117 return cache_record;
 118 }
 119
 120
 121
 122 /* Check the callout cache.
 123 Options * pm_mailfrom may be modified by cache partial results.
 124
 125 Return: TRUE if result found
 126 */
 127
 128 static BOOL
 129 cached_callout_lookup(address_item * addr, uschar * address_key,
 130   uschar * from_address, int * opt_ptr, uschar ** pm_ptr,
 131   int * yield, uschar ** failure_ptr,
 132   dbdata_callout_cache * new_domain_record, int * old_domain_res)
 133 {
 134 int options = *opt_ptr;
 135 open_db dbblock;
 136 open_db *dbm_file = NULL;
 137
 138 /* Open the callout cache database, it it exists, for reading only at this
 139 stage, unless caching has been disabled. */
 140
 141 if (options & vopt_callout_no_cache)
 142   {
 143   HDEBUG(D_verify) debug_printf("callout cache: disabled by no_cache\n");
 144   }
 145 else if (!(dbm_file = dbfn_open(US"callout", O_RDWR, &dbblock, FALSE)))
 146   {
 147   HDEBUG(D_verify) debug_printf("callout cache: not available\n");
 148   }
 149 else
 150   {
 151   /* If a cache database is available see if we can avoid the need to do an
 152   actual callout by making use of previously-obtained data. */
 153
 154   dbdata_callout_cache_address * cache_address_record;
 155   dbdata_callout_cache * cache_record = get_callout_cache_record(dbm_file,
 156       addr->domain, US"domain",
 157       callout_cache_domain_positive_expire, callout_cache_domain_negative_expire);
 158
 159   /* If an unexpired cache record was found for this domain, see if the callout
 160   process can be short-circuited. */
 161
 162   if (cache_record)
 163     {
 164     /* In most cases, if an early command (up to and including MAIL FROM:<>)
 165     was rejected, there is no point carrying on. The callout fails. However, if
 166     we are doing a recipient verification with use_sender or use_postmaster
 167     set, a previous failure of MAIL FROM:<> doesn't count, because this time we
 168     will be using a non-empty sender. We have to remember this situation so as
 169     not to disturb the cached domain value if this whole verification succeeds
 170     (we don't want it turning into "accept"). */
 171
 172     *old_domain_res = cache_record->result;
 173
 174     if (  cache_record->result == ccache_reject
 175        || *from_address == 0 && cache_record->result == ccache_reject_mfnull)
 176       {
 177       setflag(addr, af_verify_nsfail);
 178       HDEBUG(D_verify)
 179         debug_printf("callout cache: domain gave initial rejection, or "
 180           "does not accept HELO or MAIL FROM:<>\n");
 181       setflag(addr, af_verify_nsfail);
 182       addr->user_message = US"(result of an earlier callout reused).";
 183       *yield = FAIL;
 184       *failure_ptr = US"mail";
 185       dbfn_close(dbm_file);
 186       return TRUE;
 187       }
 188
 189     /* If a previous check on a "random" local part was accepted, we assume
 190     that the server does not do any checking on local parts. There is therefore
 191     no point in doing the callout, because it will always be successful. If a
 192     random check previously failed, arrange not to do it again, but preserve
 193     the data in the new record. If a random check is required but hasn't been
 194     done, skip the remaining cache processing. */
 195
 196     if (options & vopt_callout_random) switch(cache_record->random_result)
 197       {
 198       case ccache_accept:
 199         HDEBUG(D_verify)
 200           debug_printf("callout cache: domain accepts random addresses\n");
 201         dbfn_close(dbm_file);
 202         return TRUE;     /* Default yield is OK */
 203
 204       case ccache_reject:
 205         HDEBUG(D_verify)
 206           debug_printf("callout cache: domain rejects random addresses\n");
 207         *opt_ptr = options & ~vopt_callout_random;
 208         new_domain_record->random_result = ccache_reject;
 209         new_domain_record->random_stamp = cache_record->random_stamp;
 210         break;
 211
 212       default:
 213         HDEBUG(D_verify)
 214           debug_printf("callout cache: need to check random address handling "
 215             "(not cached or cache expired)\n");
 216         dbfn_close(dbm_file);
 217         return FALSE;
 218       }
 219
 220     /* If a postmaster check is requested, but there was a previous failure,
 221     there is again no point in carrying on. If a postmaster check is required,
 222     but has not been done before, we are going to have to do a callout, so skip
 223     remaining cache processing. */
 224
 225     if (*pm_ptr)
 226       {
 227       if (cache_record->postmaster_result == ccache_reject)
 228         {
 229         setflag(addr, af_verify_pmfail);
 230         HDEBUG(D_verify)
 231           debug_printf("callout cache: domain does not accept "
 232             "RCPT TO:<postmaster@domain>\n");
 233         *yield = FAIL;
 234         *failure_ptr = US"postmaster";
 235         setflag(addr, af_verify_pmfail);
 236         addr->user_message = US"(result of earlier verification reused).";
 237         dbfn_close(dbm_file);
 238         return TRUE;
 239         }
 240       if (cache_record->postmaster_result == ccache_unknown)
 241         {
 242         HDEBUG(D_verify)
 243           debug_printf("callout cache: need to check RCPT "
 244             "TO:<postmaster@domain> (not cached or cache expired)\n");
 245         dbfn_close(dbm_file);
 246         return FALSE;
 247         }
 248
 249       /* If cache says OK, set pm_mailfrom NULL to prevent a redundant
 250       postmaster check if the address itself has to be checked. Also ensure
 251       that the value in the cache record is preserved (with its old timestamp).
 252       */
 253
 254       HDEBUG(D_verify) debug_printf("callout cache: domain accepts RCPT "
 255         "TO:<postmaster@domain>\n");
 256       *pm_ptr = NULL;
 257       new_domain_record->postmaster_result = ccache_accept;
 258       new_domain_record->postmaster_stamp = cache_record->postmaster_stamp;
 259       }
 260     }
 261
 262   /* We can't give a result based on information about the domain. See if there
 263   is an unexpired cache record for this specific address (combined with the
 264   sender address if we are doing a recipient callout with a non-empty sender).
 265   */
 266
 267   if (!(cache_address_record = (dbdata_callout_cache_address *)
 268     get_callout_cache_record(dbm_file, address_key, US"address",
 269       callout_cache_positive_expire, callout_cache_negative_expire)))
 270     {
 271     dbfn_close(dbm_file);
 272     return FALSE;
 273     }
 274
 275   if (cache_address_record->result == ccache_accept)
 276     {
 277     HDEBUG(D_verify)
 278       debug_printf("callout cache: address record is positive\n");
 279     }
 280   else
 281     {
 282     HDEBUG(D_verify)
 283       debug_printf("callout cache: address record is negative\n");
 284     addr->user_message = US"Previous (cached) callout verification failure";
 285     *failure_ptr = US"recipient";
 286     *yield = FAIL;
 287     }
 288
 289   /* Close the cache database while we actually do the callout for real. */
 290
 291   dbfn_close(dbm_file);
 292   return TRUE;
 293   }
 294 return FALSE;
 295 }
 296
 297
 298 /* Write results to callout cache
 299 */
 300 static void
 301 cache_callout_write(dbdata_callout_cache * dom_rec, const uschar * domain,
 302   int done, dbdata_callout_cache_address * addr_rec, uschar * address_key)
 303 {
 304 open_db dbblock;
 305 open_db *dbm_file = NULL;
 306
 307 /* If we get here with done == TRUE, a successful callout happened, and yield
 308 will be set OK or FAIL according to the response to the RCPT command.
 309 Otherwise, we looped through the hosts but couldn't complete the business.
 310 However, there may be domain-specific information to cache in both cases.
 311
 312 The value of the result field in the new_domain record is ccache_unknown if
 313 there was an error before or with MAIL FROM:, and errno was not zero,
 314 implying some kind of I/O error. We don't want to write the cache in that case.
 315 Otherwise the value is ccache_accept, ccache_reject, or ccache_reject_mfnull. */
 316
 317 if (dom_rec->result != ccache_unknown)
 318   if (!(dbm_file = dbfn_open(US"callout", O_RDWR|O_CREAT, &dbblock, FALSE)))
 319     {
 320     HDEBUG(D_verify) debug_printf("callout cache: not available\n");
 321     }
 322   else
 323     {
 324     (void)dbfn_write(dbm_file, domain, dom_rec,
 325       (int)sizeof(dbdata_callout_cache));
 326     HDEBUG(D_verify) debug_printf("wrote callout cache domain record for %s:\n"
 327       "  result=%d postmaster=%d random=%d\n",
 328       domain,
 329       dom_rec->result,
 330       dom_rec->postmaster_result,
 331       dom_rec->random_result);
 332     }
 333
 334 /* If a definite result was obtained for the callout, cache it unless caching
 335 is disabled. */
 336
 337 if (done  &&  addr_rec->result != ccache_unknown)
 338   {
 339   if (!dbm_file)
 340     dbm_file = dbfn_open(US"callout", O_RDWR|O_CREAT, &dbblock, FALSE);
 341   if (!dbm_file)
 342     {
 343     HDEBUG(D_verify) debug_printf("no callout cache available\n");
 344     }
 345   else
 346     {
 347     (void)dbfn_write(dbm_file, address_key, addr_rec,
 348       (int)sizeof(dbdata_callout_cache_address));
 349     HDEBUG(D_verify) debug_printf("wrote %s callout cache address record for %s\n",
 350       addr_rec->result == ccache_accept ? "positive" : "negative",
 351       address_key);
 352     }
 353   }
 354
 355 if (dbm_file) dbfn_close(dbm_file);
 356 }
 357
 358
 359 /* Cutthrough-multi.  If the existing cached cutthrough connection matches
 360 the one we would make for a subsequent recipient, use it.  Send the RCPT TO
 361 and check the result, nonpipelined as it may be wanted immediately for
 362 recipient-verification.
 363
 364 It seems simpler to deal with this case separately from the main callout loop.
 365 We will need to remember it has sent, or not, so that rcpt-acl tail code
 366 can do it there for the non-rcpt-verify case.  For this we keep an addresscount.
 367
 368 Return: TRUE for a definitive result for the recipient
 369 */
 370 static int
 371 cutthrough_multi(address_item * addr, host_item * host_list,
 372   transport_feedback * tf, int * yield)
 373 {
 374 BOOL done = FALSE;
 375 host_item * host;
 376
 377 if (addr->transport == cutthrough.addr.transport)
 378   for (host = host_list; host; host = host->next)
 379     if (Ustrcmp(host->address, cutthrough.host.address) == 0)
 380       {
 381       int host_af;
 382       uschar *interface = NULL;  /* Outgoing interface to use; NULL => any */
 383       int port = 25;
 384
 385       deliver_host = host->name;
 386       deliver_host_address = host->address;
 387       deliver_host_port = host->port;
 388       deliver_domain = addr->domain;
 389       transport_name = addr->transport->name;
 390
 391       host_af = Ustrchr(host->address, ':') ? AF_INET6 : AF_INET;
 392
 393       if (!smtp_get_interface(tf->interface, host_af, addr, &interface,
 394               US"callout") ||
 395           !smtp_get_port(tf->port, addr, &port, US"callout"))
 396         log_write(0, LOG_MAIN|LOG_PANIC, "<%s>: %s", addr->address,
 397           addr->message);
 398
 399       if (  (  interface == cutthrough.interface
 400             || (  interface
 401                && cutthrough.interface
 402                && Ustrcmp(interface, cutthrough.interface) == 0
 403             )  )
 404          && port == cutthrough.host.port
 405          )
 406         {
 407         uschar * resp = NULL;
 408
 409         /* Match!  Send the RCPT TO, set done from the response */
 410         done =
 411           smtp_write_command(&ctblock, SCMD_FLUSH, "RCPT TO:<%.1000s>\r\n",
 412             transport_rcpt_address(addr,
 413                addr->transport->rcpt_include_affixes)) >= 0 &&
 414           cutthrough_response(cutthrough.fd, '2', &resp, CUTTHROUGH_DATA_TIMEOUT) == '2';
 415
 416         /* This would go horribly wrong if a callout fail was ignored by ACL.
 417         We punt by abandoning cutthrough on a reject, like the
 418         first-rcpt does. */
 419
 420         if (done)
 421           {
 422           address_item * na = store_get(sizeof(address_item));
 423           *na = cutthrough.addr;
 424           cutthrough.addr = *addr;
 425           cutthrough.addr.host_used = &cutthrough.host;
 426           cutthrough.addr.next = na;
 427
 428           cutthrough.nrcpt++;
 429           }
 430         else
 431           {
 432           cancel_cutthrough_connection(TRUE, US"recipient rejected");
 433           if (!resp || errno == ETIMEDOUT)
 434             {
 435             HDEBUG(D_verify) debug_printf("SMTP timeout\n");
 436             }
 437           else if (errno == 0)
 438             {
 439             if (*resp == 0)
 440               Ustrcpy(resp, US"connection dropped");
 441
 442             addr->message =
 443               string_sprintf("response to \"%s\" was: %s",
 444                 big_buffer, string_printing(resp));
 445
 446             addr->user_message =
 447               string_sprintf("Callout verification failed:\n%s", resp);
 448
 449             /* Hard rejection ends the process */
 450
 451             if (resp[0] == '5')   /* Address rejected */
 452               {
 453               *yield = FAIL;
 454               done = TRUE;
 455               }
 456             }
 457           }
 458         }
 459       break;    /* host_list */
 460       }
 461 if (!done)
 462   cancel_cutthrough_connection(TRUE, US"incompatible connection");
 463 return done;
 464 }
 465
 466
 467 /*************************************************
 468 *      Do callout verification for an address    *
 469 *************************************************/
 470
 471 /* This function is called from verify_address() when the address has routed to
 472 a host list, and a callout has been requested. Callouts are expensive; that is
 473 why a cache is used to improve the efficiency.
 474
 475 Arguments:
 476   addr              the address that's been routed
 477   host_list         the list of hosts to try
 478   tf                the transport feedback block
 479
 480   ifstring          "interface" option from transport, or NULL
 481   portstring        "port" option from transport, or NULL
 482   protocolstring    "protocol" option from transport, or NULL
 483   callout           the per-command callout timeout
 484   callout_overall   the overall callout timeout (if < 0 use 4*callout)
 485   callout_connect   the callout connection timeout (if < 0 use callout)
 486   options           the verification options - these bits are used:
 487                       vopt_is_recipient => this is a recipient address
 488                       vopt_callout_no_cache => don't use callout cache
 489                       vopt_callout_fullpm => if postmaster check, do full one
 490                       vopt_callout_random => do the "random" thing
 491                       vopt_callout_recipsender => use real sender for recipient
 492                       vopt_callout_recippmaster => use postmaster for recipient
 493                       vopt_callout_hold         => lazy close connection
 494   se_mailfrom         MAIL FROM address for sender verify; NULL => ""
 495   pm_mailfrom         if non-NULL, do the postmaster check with this sender
 496
 497 Returns:            OK/FAIL/DEFER
 498 */
 499
 500 static int
 501 do_callout(address_item *addr, host_item *host_list, transport_feedback *tf,
 502   int callout, int callout_overall, int callout_connect, int options,
 503   uschar *se_mailfrom, uschar *pm_mailfrom)
 504 {
 505 int yield = OK;
 506 int old_domain_cache_result = ccache_accept;
 507 BOOL done = FALSE;
 508 uschar *address_key;
 509 uschar *from_address;
 510 uschar *random_local_part = NULL;
 511 const uschar *save_deliver_domain = deliver_domain;
 512 uschar **failure_ptr = options & vopt_is_recipient
 513   ? &recipient_verify_failure : &sender_verify_failure;
 514 dbdata_callout_cache new_domain_record;
 515 dbdata_callout_cache_address new_address_record;
 516 time_t callout_start_time;
 517
 518 new_domain_record.result = ccache_unknown;
 519 new_domain_record.postmaster_result = ccache_unknown;
 520 new_domain_record.random_result = ccache_unknown;
 521
 522 memset(&new_address_record, 0, sizeof(new_address_record));
 523
 524 /* For a recipient callout, the key used for the address cache record must
 525 include the sender address if we are using the real sender in the callout,
 526 because that may influence the result of the callout. */
 527
 528 if (options & vopt_is_recipient)
 529   if (options & vopt_callout_recipsender)
 530     {
 531     from_address = sender_address;
 532     address_key = string_sprintf("%s/<%s>", addr->address, sender_address);
 533     if (cutthrough.delivery) options |= vopt_callout_no_cache;
 534     }
 535   else if (options & vopt_callout_recippmaster)
 536     {
 537     from_address = string_sprintf("postmaster@%s", qualify_domain_sender);
 538     address_key = string_sprintf("%s/<postmaster@%s>", addr->address,
 539       qualify_domain_sender);
 540     }
 541   else
 542     {
 543     from_address = US"";
 544     address_key = addr->address;
 545     }
 546
 547 /* For a sender callout, we must adjust the key if the mailfrom address is not
 548 empty. */
 549
 550 else
 551   {
 552   from_address = se_mailfrom ? se_mailfrom : US"";
 553   address_key = *from_address
 554     ? string_sprintf("%s/<%s>", addr->address, from_address) : addr->address;
 555   }
 556
 557 if (cached_callout_lookup(addr, address_key, from_address,
 558       &options, &pm_mailfrom, &yield, failure_ptr,
 559       &new_domain_record, &old_domain_cache_result))
 560   {
 561   cancel_cutthrough_connection(TRUE, US"cache-hit");
 562   goto END_CALLOUT;
 563   }
 564
 565 if (!addr->transport)
 566   {
 567   HDEBUG(D_verify) debug_printf("cannot callout via null transport\n");
 568   }
 569 else if (Ustrcmp(addr->transport->driver_name, "smtp") != 0)
 570   log_write(0, LOG_MAIN|LOG_PANIC|LOG_CONFIG_FOR, "callout transport '%s': %s is non-smtp",
 571     addr->transport->name, addr->transport->driver_name);
 572 else
 573   {
 574   smtp_transport_options_block *ob =
 575     (smtp_transport_options_block *)addr->transport->options_block;
 576   host_item * host;
 577
 578   /* The information wasn't available in the cache, so we have to do a real
 579   callout and save the result in the cache for next time, unless no_cache is set,
 580   or unless we have a previously cached negative random result. If we are to test
 581   with a random local part, ensure that such a local part is available. If not,
 582   log the fact, but carry on without randomising. */
 583
 584   if (options & vopt_callout_random  &&  callout_random_local_part)
 585     if (!(random_local_part = expand_string(callout_random_local_part)))
 586       log_write(0, LOG_MAIN|LOG_PANIC, "failed to expand "
 587         "callout_random_local_part: %s", expand_string_message);
 588
 589   /* Default the connect and overall callout timeouts if not set, and record the
 590   time we are starting so that we can enforce it. */
 591
 592   if (callout_overall < 0) callout_overall = 4 * callout;
 593   if (callout_connect < 0) callout_connect = callout;
 594   callout_start_time = time(NULL);
 595
 596   /* Before doing a real callout, if this is an SMTP connection, flush the SMTP
 597   output because a callout might take some time. When PIPELINING is active and
 598   there are many recipients, the total time for doing lots of callouts can add up
 599   and cause the client to time out. So in this case we forgo the PIPELINING
 600   optimization. */
 601
 602   if (smtp_out && !disable_callout_flush) mac_smtp_fflush();
 603
 604   clearflag(addr, af_verify_pmfail);  /* postmaster callout flag */
 605   clearflag(addr, af_verify_nsfail);  /* null sender callout flag */
 606
 607 /* cutthrough-multi: if a nonfirst rcpt has the same routing as the first,
 608 and we are holding a cutthrough conn open, we can just append the rcpt to
 609 that conn for verification purposes (and later delivery also).  Simplest
 610 coding means skipping this whole loop and doing the append separately.  */
 611
 612   /* Can we re-use an open cutthrough connection? */
 613   if (  cutthrough.fd >= 0
 614      && (options & (vopt_callout_recipsender | vopt_callout_recippmaster))
 615         == vopt_callout_recipsender
 616      && !random_local_part
 617      && !pm_mailfrom
 618      )
 619     done = cutthrough_multi(addr, host_list, tf, &yield);
 620
 621   /* If we did not use a cached connection, make connections to the hosts
 622   and do real callouts. The list of hosts is passed in as an argument. */
 623
 624   for (host = host_list; host && !done; host = host->next)
 625     {
 626     int host_af;
 627     int port = 25;
 628     uschar *interface = NULL;  /* Outgoing interface to use; NULL => any */
 629     smtp_context sx;
 630
 631     if (!host->address)
 632       {
 633       DEBUG(D_verify) debug_printf("no IP address for host name %s: skipping\n",
 634         host->name);
 635       continue;
 636       }
 637
 638     /* Check the overall callout timeout */
 639
 640     if (time(NULL) - callout_start_time >= callout_overall)
 641       {
 642       HDEBUG(D_verify) debug_printf("overall timeout for callout exceeded\n");
 643       break;
 644       }
 645
 646     /* Set IPv4 or IPv6 */
 647
 648     host_af = Ustrchr(host->address, ':') ? AF_INET6 : AF_INET;
 649
 650     /* Expand and interpret the interface and port strings. The latter will not
 651     be used if there is a host-specific port (e.g. from a manualroute router).
 652     This has to be delayed till now, because they may expand differently for
 653     different hosts. If there's a failure, log it, but carry on with the
 654     defaults. */
 655
 656     deliver_host = host->name;
 657     deliver_host_address = host->address;
 658     deliver_host_port = host->port;
 659     deliver_domain = addr->domain;
 660     transport_name = addr->transport->name;
 661
 662     if (  !smtp_get_interface(tf->interface, host_af, addr, &interface,
 663             US"callout")
 664        || !smtp_get_port(tf->port, addr, &port, US"callout")
 665        )
 666       log_write(0, LOG_MAIN|LOG_PANIC, "<%s>: %s", addr->address,
 667         addr->message);
 668
 669     sx.addrlist = addr;
 670     sx.host = host;
 671     sx.host_af = host_af,
 672     sx.port = port;
 673     sx.interface = interface;
 674     sx.helo_data = tf->helo_data;
 675     sx.tblock = addr->transport;
 676     sx.verify = TRUE;
 677
 678 tls_retry_connection:
 679     /* Set the address state so that errors are recorded in it */
 680
 681     addr->transport_return = PENDING_DEFER;
 682     ob->connect_timeout = callout_connect;
 683     ob->command_timeout = callout;
 684
 685     /* Get the channel set up ready for a message (MAIL FROM being the next
 686     SMTP command to send.  If we tried TLS but it failed, try again without
 687     if permitted */
 688
 689     yield = smtp_setup_conn(&sx, FALSE);
 690 #ifdef SUPPORT_TLS
 691     if (  yield == DEFER
 692        && addr->basic_errno == ERRNO_TLSFAILURE
 693        && ob->tls_tempfail_tryclear
 694        && verify_check_given_host(&ob->hosts_require_tls, host) != OK
 695        )
 696       {
 697       log_write(0, LOG_MAIN,
 698         "%s: callout unencrypted to %s [%s] (not in hosts_require_tls)",
 699         addr->message, host->name, host->address);
 700       addr->transport_return = PENDING_DEFER;
 701       yield = smtp_setup_conn(&sx, TRUE);
 702       }
 703 #endif
 704     if (yield != OK)
 705       {
 706       errno = addr->basic_errno;
 707       transport_name = NULL;
 708       deliver_host = deliver_host_address = NULL;
 709       deliver_domain = save_deliver_domain;
 710
 711       /* Failure to accept HELO is cached; this blocks the whole domain for all
 712       senders. I/O errors and defer responses are not cached. */
 713
 714       if (yield == FAIL && (errno == 0 || errno == ERRNO_SMTPCLOSED))
 715         {
 716         setflag(addr, af_verify_nsfail);
 717         new_domain_record.result = ccache_reject;
 718         done = TRUE;
 719         }
 720       else
 721         done = FALSE;
 722       goto no_conn;
 723       }
 724
 725     /* If we needed to authenticate, smtp_setup_conn() did that.  Copy
 726     the AUTH info for logging */
 727
 728     addr->authenticator = client_authenticator;
 729     addr->auth_id = client_authenticated_id;
 730
 731     sx.from_addr = from_address;
 732     sx.first_addr = sx.sync_addr = addr;
 733     sx.ok = FALSE;                      /*XXX these 3 last might not be needed for verify? */
 734     sx.send_rset = TRUE;
 735     sx.completed_addr = FALSE;
 736
 737     new_domain_record.result = old_domain_cache_result == ccache_reject_mfnull
 738       ? ccache_reject_mfnull : ccache_accept;
 739
 740     /* Do the random local part check first. Temporarily replace the recipient
 741     with the "random" value */
 742
 743     if (random_local_part)
 744       {
 745       uschar * main_address = addr->address;
 746       const uschar * rcpt_domain = addr->domain;
 747
 748 #ifdef SUPPORT_I18N
 749       uschar * errstr = NULL;
 750       if (  testflag(addr, af_utf8_downcvt)
 751          && (rcpt_domain = string_domain_utf8_to_alabel(rcpt_domain,
 752                                     &errstr), errstr)
 753          )
 754         {
 755         addr->message = errstr;
 756         errno = ERRNO_EXPANDFAIL;
 757         setflag(addr, af_verify_nsfail);
 758         done = FALSE;
 759         rcpt_domain = US"";  /*XXX errorhandling! */
 760         }
 761 #endif
 762
 763       /* This would be ok for 1st rcpt of a cutthrough (the case handled here;
 764       subsequents are done in cutthrough_multi()), but no way to
 765       handle a subsequent because of the RSET vaporising the MAIL FROM.
 766       So refuse to support any.  Most cutthrough use will not involve
 767       random_local_part, so no loss. */
 768       cancel_cutthrough_connection(TRUE, US"random-recipient");
 769
 770       addr->address = string_sprintf("%s@%.1000s",
 771                                     random_local_part, rcpt_domain);
 772       done = FALSE;
 773
 774       /* If accepted, we aren't going to do any further tests below.
 775       Otherwise, cache a real negative response, and get back to the right
 776       state to send RCPT. Unless there's some problem such as a dropped
 777       connection, we expect to succeed, because the commands succeeded above.
 778       However, some servers drop the connection after responding to an
 779       invalid recipient, so on (any) error we drop and remake the connection.
 780       XXX We don't care about that for postmaster_full.  Should we?
 781
 782       XXX could we add another flag to the context, and have the common
 783       code emit the RSET too?  Even pipelined after the RCPT...
 784       Then the main-verify call could use it if there's to be a subsequent
 785       postmaster-verify.
 786       The sync_responses() would need to be taught about it and we'd
 787       need another return code filtering out to here.
 788       */
 789
 790       /* Remember when we last did a random test */
 791       new_domain_record.random_stamp = time(NULL);
 792
 793       if (smtp_write_mail_and_rcpt_cmds(&sx, &yield) == 0)
 794         switch(addr->transport_return)
 795           {
 796           case PENDING_OK:
 797             new_domain_record.random_result = ccache_accept;
 798             break;
 799           case FAIL:
 800             new_domain_record.random_result = ccache_reject;
 801
 802             /* Between each check, issue RSET, because some servers accept only
 803             one recipient after MAIL FROM:<>.
 804             XXX We don't care about that for postmaster_full.  Should we? */
 805
 806             if ((done =
 807               smtp_write_command(&sx.outblock, SCMD_FLUSH, "RSET\r\n") >= 0 &&
 808               smtp_read_response(&sx.inblock, sx.buffer, sizeof(sx.buffer),
 809                 '2', callout)))
 810               break;
 811
 812             HDEBUG(D_acl|D_v)
 813               debug_printf_indent("problem after random/rset/mfrom; reopen conn\n");
 814             random_local_part = NULL;
 815 #ifdef SUPPORT_TLS
 816             tls_close(FALSE, TRUE);
 817 #endif
 818             HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP(close)>>\n");
 819             (void)close(sx.inblock.sock);
 820             sx.inblock.sock = sx.outblock.sock = -1;
 821 #ifndef DISABLE_EVENT
 822             (void) event_raise(addr->transport->event_action,
 823                               US"tcp:close", NULL);
 824 #endif
 825             addr->address = main_address;
 826             addr->transport_return = PENDING_DEFER;
 827             sx.first_addr = sx.sync_addr = addr;
 828             sx.ok = FALSE;
 829             sx.send_rset = TRUE;
 830             sx.completed_addr = FALSE;
 831             goto tls_retry_connection;
 832           }
 833
 834       /* Re-setup for main verify, or for the error message when failing */
 835       addr->address = main_address;
 836       addr->transport_return = PENDING_DEFER;
 837       sx.first_addr = sx.sync_addr = addr;
 838       sx.ok = FALSE;
 839       sx.send_rset = TRUE;
 840       sx.completed_addr = FALSE;
 841       }
 842     else
 843       done = TRUE;
 844
 845     /* Main verify. If the host is accepting all local parts, as determined
 846     by the "random" check, we don't need to waste time doing any further
 847     checking. */
 848
 849     if (done)
 850       {
 851       done = FALSE;
 852       switch(smtp_write_mail_and_rcpt_cmds(&sx, &yield))
 853         {
 854         case 0:  switch(addr->transport_return) /* ok so far */
 855                     {
 856                     case PENDING_OK:  done = TRUE;
 857                                       new_address_record.result = ccache_accept;
 858                                       break;
 859                     case FAIL:        done = TRUE;
 860                                       yield = FAIL;
 861                                       *failure_ptr = US"recipient";
 862                                       new_address_record.result = ccache_reject;
 863                                       break;
 864                     default:          break;
 865                     }
 866                   break;
 867
 868         case -1:                                /* MAIL response error */
 869                   *failure_ptr = US"mail";
 870                   if (errno == 0 && sx.buffer[0] == '5')
 871                     {
 872                     setflag(addr, af_verify_nsfail);
 873                     if (from_address[0] == 0)
 874                       new_domain_record.result = ccache_reject_mfnull;
 875                     }
 876                   break;
 877                                                 /* non-MAIL read i/o error */
 878                                                 /* non-MAIL response timeout */
 879                                                 /* internal error; channel still usable */
 880         default:  break;                        /* transmit failed */
 881         }
 882       }
 883
 884     addr->auth_sndr = client_authenticated_sender;
 885
 886     deliver_host = deliver_host_address = NULL;
 887     deliver_domain = save_deliver_domain;
 888
 889     /* Do postmaster check if requested; if a full check is required, we
 890     check for RCPT TO:<postmaster> (no domain) in accordance with RFC 821. */
 891
 892     if (done && pm_mailfrom)
 893       {
 894       /* Could possibly shift before main verify, just above, and be ok
 895       for cutthrough.  But no way to handle a subsequent rcpt, so just
 896       refuse any */
 897       cancel_cutthrough_connection(TRUE, US"postmaster verify");
 898       HDEBUG(D_acl|D_v) debug_printf_indent("Cutthrough cancelled by presence of postmaster verify\n");
 899
 900       done = smtp_write_command(&sx.outblock, SCMD_FLUSH, "RSET\r\n") >= 0
 901           && smtp_read_response(&sx.inblock, sx.buffer,
 902                                 sizeof(sx.buffer), '2', callout);
 903
 904       if (done)
 905         {
 906         uschar * main_address = addr->address;
 907
 908         /*XXX oops, affixes */
 909         addr->address = string_sprintf("postmaster@%.1000s", addr->domain);
 910         addr->transport_return = PENDING_DEFER;
 911
 912         sx.from_addr = pm_mailfrom;
 913         sx.first_addr = sx.sync_addr = addr;
 914         sx.ok = FALSE;
 915         sx.send_rset = TRUE;
 916         sx.completed_addr = FALSE;
 917
 918         if(  smtp_write_mail_and_rcpt_cmds(&sx, &yield) == 0
 919           && addr->transport_return == PENDING_OK
 920           )
 921           done = TRUE;
 922         else
 923           done = (options & vopt_callout_fullpm) != 0
 924               && smtp_write_command(&sx.outblock, SCMD_FLUSH,
 925                             "RCPT TO:<postmaster>\r\n") >= 0
 926               && smtp_read_response(&sx.inblock, sx.buffer,
 927                             sizeof(sx.buffer), '2', callout);
 928
 929         /* Sort out the cache record */
 930
 931         new_domain_record.postmaster_stamp = time(NULL);
 932
 933         if (done)
 934           new_domain_record.postmaster_result = ccache_accept;
 935         else if (errno == 0 && sx.buffer[0] == '5')
 936           {
 937           *failure_ptr = US"postmaster";
 938           setflag(addr, af_verify_pmfail);
 939           new_domain_record.postmaster_result = ccache_reject;
 940           }
 941
 942         addr->address = main_address;
 943         }
 944       }
 945     /* For any failure of the main check, other than a negative response, we just
 946     close the connection and carry on. We can identify a negative response by the
 947     fact that errno is zero. For I/O errors it will be non-zero
 948
 949     Set up different error texts for logging and for sending back to the caller
 950     as an SMTP response. Log in all cases, using a one-line format. For sender
 951     callouts, give a full response to the caller, but for recipient callouts,
 952     don't give the IP address because this may be an internal host whose identity
 953     is not to be widely broadcast. */
 954
 955 no_conn:
 956     switch(errno)
 957       {
 958       case ETIMEDOUT:
 959         HDEBUG(D_verify) debug_printf("SMTP timeout\n");
 960         sx.send_quit = FALSE;
 961         break;
 962
 963 #ifdef SUPPORT_I18N
 964       case ERRNO_UTF8_FWD:
 965         {
 966         extern int acl_where;   /* src/acl.c */
 967         errno = 0;
 968         addr->message = string_sprintf(
 969             "response to \"EHLO\" did not include SMTPUTF8");
 970         addr->user_message = acl_where == ACL_WHERE_RCPT
 971           ? US"533 no support for internationalised mailbox name"
 972           : US"550 mailbox unavailable";
 973         yield = FAIL;
 974         done = TRUE;
 975         }
 976         break;
 977 #endif
 978       case ECONNREFUSED:
 979         sx.send_quit = FALSE;
 980         break;
 981
 982       case 0:
 983         if (*sx.buffer == 0) Ustrcpy(sx.buffer, US"connection dropped");
 984
 985         /*XXX test here is ugly; seem to have a split of responsibility for
 986         building this message.  Need to reationalise.  Where is it done
 987         before here, and when not?
 988         Not == 5xx resp to MAIL on main-verify
 989         */
 990         if (!addr->message) addr->message =
 991           string_sprintf("response to \"%s\" was: %s",
 992                           big_buffer, string_printing(sx.buffer));
 993
 994         addr->user_message = options & vopt_is_recipient
 995           ? string_sprintf("Callout verification failed:\n%s", sx.buffer)
 996           : string_sprintf("Called:   %s\nSent:     %s\nResponse: %s",
 997             host->address, big_buffer, sx.buffer);
 998
 999         /* Hard rejection ends the process */
1000
1001         if (sx.buffer[0] == '5')   /* Address rejected */
1002           {
1003           yield = FAIL;
1004           done = TRUE;
1005           }
1006         break;
1007       }
1008
1009     /* End the SMTP conversation and close the connection. */
1010
1011     /* Cutthrough - on a successful connect and recipient-verify with
1012     use-sender and we are 1st rcpt and have no cutthrough conn so far
1013     here is where we want to leave the conn open.  Ditto for a lazy-close
1014     verify. */
1015
1016     if (  (cutthrough.delivery || options & vopt_callout_hold)
1017        && rcpt_count == 1
1018        && done
1019        && yield == OK
1020        &&    (options & (vopt_callout_recipsender|vopt_callout_recippmaster|vopt_success_on_redirect))
1021            == vopt_callout_recipsender
1022        && !random_local_part
1023        && !pm_mailfrom
1024        && cutthrough.fd < 0
1025        && !sx.lmtp
1026        )
1027       {
1028       HDEBUG(D_acl|D_v) debug_printf_indent("holding verify callout open for %s\n",
1029         cutthrough.delivery
1030         ? "cutthrough delivery" : "potential further verifies and delivery");
1031
1032       cutthrough.callout_hold_only = !cutthrough.delivery;
1033       cutthrough.is_tls =       tls_out.active >= 0;
1034       cutthrough.fd =   sx.outblock.sock;       /* We assume no buffer in use in the outblock */
1035       cutthrough.nrcpt =        1;
1036       cutthrough.transport =    addr->transport->name;
1037       cutthrough.interface =    interface;
1038       cutthrough.snd_port =     sending_port;
1039       cutthrough.peer_options = smtp_peer_options;
1040       cutthrough.host =         *host;
1041         {
1042         int oldpool = store_pool;
1043         store_pool = POOL_PERM;
1044         cutthrough.snd_ip = string_copy(sending_ip_address);
1045         cutthrough.host.name = string_copy(host->name);
1046         cutthrough.host.address = string_copy(host->address);
1047         store_pool = oldpool;
1048         }
1049       cutthrough.addr =         *addr;          /* Save the address_item for later logging */
1050       cutthrough.addr.next =    NULL;
1051       cutthrough.addr.host_used = &cutthrough.host;
1052       if (addr->parent)
1053         *(cutthrough.addr.parent = store_get(sizeof(address_item))) =
1054           *addr->parent;
1055       ctblock.buffer = ctbuffer;
1056       ctblock.buffersize = sizeof(ctbuffer);
1057       ctblock.ptr = ctbuffer;
1058       /* ctblock.cmd_count = 0; ctblock.authenticating = FALSE; */
1059       ctblock.sock = cutthrough.fd;
1060       }
1061     else
1062       {
1063       /* Ensure no cutthrough on multiple verifies that were incompatible */
1064       if (options & vopt_callout_recipsender)
1065         cancel_cutthrough_connection(TRUE, US"not usable for cutthrough");
1066       if (sx.send_quit)
1067         {
1068         (void) smtp_write_command(&sx.outblock, SCMD_FLUSH, "QUIT\r\n");
1069
1070         /* Wait a short time for response, and discard it */
1071         smtp_read_response(&sx.inblock, sx.buffer, sizeof(sx.buffer),
1072           '2', 1);
1073         }
1074
1075       if (sx.inblock.sock >= 0)
1076         {
1077 #ifdef SUPPORT_TLS
1078         tls_close(FALSE, TRUE);
1079 #endif
1080         HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP(close)>>\n");
1081         (void)close(sx.inblock.sock);
1082         sx.inblock.sock = sx.outblock.sock = -1;
1083 #ifndef DISABLE_EVENT
1084         (void) event_raise(addr->transport->event_action, US"tcp:close", NULL);
1085 #endif
1086         }
1087       }
1088
1089     if (!done || yield != OK)
1090       addr->message = string_sprintf("%s [%s] : %s", host->name, host->address,
1091                                     addr->message);
1092     }    /* Loop through all hosts, while !done */
1093   }
1094
1095 /* If we get here with done == TRUE, a successful callout happened, and yield
1096 will be set OK or FAIL according to the response to the RCPT command.
1097 Otherwise, we looped through the hosts but couldn't complete the business.
1098 However, there may be domain-specific information to cache in both cases. */
1099
1100 if (!(options & vopt_callout_no_cache))
1101   cache_callout_write(&new_domain_record, addr->domain,
1102     done, &new_address_record, address_key);
1103
1104 /* Failure to connect to any host, or any response other than 2xx or 5xx is a
1105 temporary error. If there was only one host, and a response was received, leave
1106 it alone if supplying details. Otherwise, give a generic response. */
1107
1108 if (!done)
1109   {
1110   uschar * dullmsg = string_sprintf("Could not complete %s verify callout",
1111     options & vopt_is_recipient ? "recipient" : "sender");
1112   yield = DEFER;
1113
1114   addr->message = host_list->next || !addr->message
1115     ? dullmsg : string_sprintf("%s: %s", dullmsg, addr->message);
1116
1117   addr->user_message = smtp_return_error_details
1118     ? string_sprintf("%s for <%s>.\n"
1119       "The mail server(s) for the domain may be temporarily unreachable, or\n"
1120       "they may be permanently unreachable from this server. In the latter case,\n%s",
1121       dullmsg, addr->address,
1122       options & vopt_is_recipient
1123         ? "the address will never be accepted."
1124         : "you need to change the address or create an MX record for its domain\n"
1125           "if it is supposed to be generally accessible from the Internet.\n"
1126           "Talk to your mail administrator for details.")
1127     : dullmsg;
1128
1129   /* Force a specific error code */
1130
1131   addr->basic_errno = ERRNO_CALLOUTDEFER;
1132   }
1133
1134 /* Come here from within the cache-reading code on fast-track exit. */
1135
1136 END_CALLOUT:
1137 tls_modify_variables(&tls_in);
1138 return yield;
1139 }
1140
1141
1142
1143 /* Called after recipient-acl to get a cutthrough connection open when
1144    one was requested and a recipient-verify wasn't subsequently done.
1145 */
1146 int
1147 open_cutthrough_connection( address_item * addr )
1148 {
1149 address_item addr2;
1150 int rc;
1151
1152 /* Use a recipient-verify-callout to set up the cutthrough connection. */
1153 /* We must use a copy of the address for verification, because it might
1154 get rewritten. */
1155
1156 addr2 = *addr;
1157 HDEBUG(D_acl) debug_printf_indent("----------- %s cutthrough setup ------------\n",
1158   rcpt_count > 1 ? "more" : "start");
1159 rc = verify_address(&addr2, NULL,
1160         vopt_is_recipient | vopt_callout_recipsender | vopt_callout_no_cache,
1161         CUTTHROUGH_CMD_TIMEOUT, -1, -1,
1162         NULL, NULL, NULL);
1163 addr->message = addr2.message;
1164 addr->user_message = addr2.user_message;
1165 HDEBUG(D_acl) debug_printf_indent("----------- end cutthrough setup ------------\n");
1166 return rc;
1167 }
1168
1169
1170
1171 /* Send given number of bytes from the buffer */
1172 static BOOL
1173 cutthrough_send(int n)
1174 {
1175 if(cutthrough.fd < 0)
1176   return TRUE;
1177
1178 if(
1179 #ifdef SUPPORT_TLS
1180    (tls_out.active == cutthrough.fd) ? tls_write(FALSE, ctblock.buffer, n) :
1181 #endif
1182    send(cutthrough.fd, ctblock.buffer, n, 0) > 0
1183   )
1184 {
1185   transport_count += n;
1186   ctblock.ptr= ctblock.buffer;
1187   return TRUE;
1188 }
1189
1190 HDEBUG(D_transport|D_acl) debug_printf_indent("cutthrough_send failed: %s\n", strerror(errno));
1191 return FALSE;
1192 }
1193
1194
1195
1196 static BOOL
1197 _cutthrough_puts(uschar * cp, int n)
1198 {
1199 while(n--)
1200  {
1201  if(ctblock.ptr >= ctblock.buffer+ctblock.buffersize)
1202    if(!cutthrough_send(ctblock.buffersize))
1203      return FALSE;
1204
1205  *ctblock.ptr++ = *cp++;
1206  }
1207 return TRUE;
1208 }
1209
1210 /* Buffered output of counted data block.   Return boolean success */
1211 static BOOL
1212 cutthrough_puts(uschar * cp, int n)
1213 {
1214 if (cutthrough.fd < 0)       return TRUE;
1215 if (_cutthrough_puts(cp, n)) return TRUE;
1216 cancel_cutthrough_connection(TRUE, US"transmit failed");
1217 return FALSE;
1218 }
1219
1220 void
1221 cutthrough_data_puts(uschar * cp, int n)
1222 {
1223 if (cutthrough.delivery) (void) cutthrough_puts(cp, n);
1224 return;
1225 }
1226
1227
1228 static BOOL
1229 _cutthrough_flush_send(void)
1230 {
1231 int n = ctblock.ptr - ctblock.buffer;
1232
1233 if(n>0)
1234   if(!cutthrough_send(n))
1235     return FALSE;
1236 return TRUE;
1237 }
1238
1239
1240 /* Send out any bufferred output.  Return boolean success. */
1241 BOOL
1242 cutthrough_flush_send(void)
1243 {
1244 if (_cutthrough_flush_send()) return TRUE;
1245 cancel_cutthrough_connection(TRUE, US"transmit failed");
1246 return FALSE;
1247 }
1248
1249
1250 static BOOL
1251 cutthrough_put_nl(void)
1252 {
1253 return cutthrough_puts(US"\r\n", 2);
1254 }
1255
1256
1257 void
1258 cutthrough_data_put_nl(void)
1259 {
1260 cutthrough_data_puts(US"\r\n", 2);
1261 }
1262
1263
1264 /* Get and check response from cutthrough target */
1265 static uschar
1266 cutthrough_response(int fd, char expect, uschar ** copy, int timeout)
1267 {
1268 smtp_inblock inblock;
1269 uschar inbuffer[4096];
1270 uschar responsebuffer[4096];
1271
1272 inblock.buffer = inbuffer;
1273 inblock.buffersize = sizeof(inbuffer);
1274 inblock.ptr = inbuffer;
1275 inblock.ptrend = inbuffer;
1276 inblock.sock = fd;
1277 /* this relies on (inblock.sock == tls_out.active) */
1278 if(!smtp_read_response(&inblock, responsebuffer, sizeof(responsebuffer), expect, timeout))
1279   cancel_cutthrough_connection(TRUE, US"target timeout on read");
1280
1281 if(copy)
1282   {
1283   uschar * cp;
1284   *copy = cp = string_copy(responsebuffer);
1285   /* Trim the trailing end of line */
1286   cp += Ustrlen(responsebuffer);
1287   if(cp > *copy  &&  cp[-1] == '\n') *--cp = '\0';
1288   if(cp > *copy  &&  cp[-1] == '\r') *--cp = '\0';
1289   }
1290
1291 return responsebuffer[0];
1292 }
1293
1294
1295 /* Negotiate dataphase with the cutthrough target, returning success boolean */
1296 BOOL
1297 cutthrough_predata(void)
1298 {
1299 if(cutthrough.fd < 0 || cutthrough.callout_hold_only)
1300   return FALSE;
1301
1302 HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP>> DATA\n");
1303 cutthrough_puts(US"DATA\r\n", 6);
1304 cutthrough_flush_send();
1305
1306 /* Assume nothing buffered.  If it was it gets ignored. */
1307 return cutthrough_response(cutthrough.fd, '3', NULL, CUTTHROUGH_DATA_TIMEOUT) == '3';
1308 }
1309
1310
1311 /* tctx arg only to match write_chunk() */
1312 static BOOL
1313 cutthrough_write_chunk(transport_ctx * tctx, uschar * s, int len)
1314 {
1315 uschar * s2;
1316 while(s && (s2 = Ustrchr(s, '\n')))
1317  {
1318  if(!cutthrough_puts(s, s2-s) || !cutthrough_put_nl())
1319   return FALSE;
1320  s = s2+1;
1321  }
1322 return TRUE;
1323 }
1324
1325
1326 /* Buffered send of headers.  Return success boolean. */
1327 /* Expands newlines to wire format (CR,NL).           */
1328 /* Also sends header-terminating blank line.          */
1329 BOOL
1330 cutthrough_headers_send(void)
1331 {
1332 transport_ctx tctx;
1333
1334 if(cutthrough.fd < 0 || cutthrough.callout_hold_only)
1335   return FALSE;
1336
1337 /* We share a routine with the mainline transport to handle header add/remove/rewrites,
1338    but having a separate buffered-output function (for now)
1339 */
1340 HDEBUG(D_acl) debug_printf_indent("----------- start cutthrough headers send -----------\n");
1341
1342 tctx.u.fd = cutthrough.fd;
1343 tctx.tblock = cutthrough.addr.transport;
1344 tctx.addr = &cutthrough.addr;
1345 tctx.check_string = US".";
1346 tctx.escape_string = US"..";
1347 tctx.options = topt_use_crlf;
1348
1349 if (!transport_headers_send(&tctx, &cutthrough_write_chunk))
1350   return FALSE;
1351
1352 HDEBUG(D_acl) debug_printf_indent("----------- done cutthrough headers send ------------\n");
1353 return TRUE;
1354 }
1355
1356
1357 static void
1358 close_cutthrough_connection(const uschar * why)
1359 {
1360 int fd = cutthrough.fd;
1361 if(fd >= 0)
1362   {
1363   /* We could be sending this after a bunch of data, but that is ok as
1364      the only way to cancel the transfer in dataphase is to drop the tcp
1365      conn before the final dot.
1366   */
1367   ctblock.ptr = ctbuffer;
1368   HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP>> QUIT\n");
1369   _cutthrough_puts(US"QUIT\r\n", 6);    /* avoid recursion */
1370   _cutthrough_flush_send();
1371   cutthrough.fd = -1;                   /* avoid recursion via read timeout */
1372
1373   /* Wait a short time for response, and discard it */
1374   cutthrough_response(fd, '2', NULL, 1);
1375
1376 #ifdef SUPPORT_TLS
1377   tls_close(FALSE, TRUE);
1378 #endif
1379   HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP(close)>>\n");
1380   (void)close(fd);
1381   HDEBUG(D_acl) debug_printf_indent("----------- cutthrough shutdown (%s) ------------\n", why);
1382   }
1383 ctblock.ptr = ctbuffer;
1384 }
1385
1386 void
1387 cancel_cutthrough_connection(BOOL close_noncutthrough_verifies, const uschar * why)
1388 {
1389 if (cutthrough.delivery || close_noncutthrough_verifies)
1390   close_cutthrough_connection(why);
1391 cutthrough.delivery = cutthrough.callout_hold_only = FALSE;
1392 }
1393
1394
1395 void
1396 release_cutthrough_connection(const uschar * why)
1397 {
1398 if (cutthrough.fd < 0) return;
1399 HDEBUG(D_acl) debug_printf_indent("release cutthrough conn: %s\n", why);
1400 cutthrough.fd = -1;
1401 cutthrough.delivery = cutthrough.callout_hold_only = FALSE;
1402 }
1403
1404
1405
1406
1407 /* Have senders final-dot.  Send one to cutthrough target, and grab the response.
1408    Log an OK response as a transmission.
1409    Close the connection.
1410    Return smtp response-class digit.
1411 */
1412 uschar *
1413 cutthrough_finaldot(void)
1414 {
1415 uschar res;
1416 address_item * addr;
1417 HDEBUG(D_transport|D_acl|D_v) debug_printf_indent("  SMTP>> .\n");
1418
1419 /* Assume data finshed with new-line */
1420 if(  !cutthrough_puts(US".", 1)
1421   || !cutthrough_put_nl()
1422   || !cutthrough_flush_send()
1423   )
1424   return cutthrough.addr.message;
1425
1426 res = cutthrough_response(cutthrough.fd, '2', &cutthrough.addr.message, CUTTHROUGH_DATA_TIMEOUT);
1427 for (addr = &cutthrough.addr; addr; addr = addr->next)
1428   {
1429   addr->message = cutthrough.addr.message;
1430   switch(res)
1431     {
1432     case '2':
1433       delivery_log(LOG_MAIN, addr, (int)'>', NULL);
1434       close_cutthrough_connection(US"delivered");
1435       break;
1436
1437     case '4':
1438       delivery_log(LOG_MAIN, addr, 0,
1439         US"tmp-reject from cutthrough after DATA:");
1440       break;
1441
1442     case '5':
1443       delivery_log(LOG_MAIN|LOG_REJECT, addr, 0,
1444         US"rejected after DATA:");
1445       break;
1446
1447     default:
1448       break;
1449     }
1450   }
1451 return cutthrough.addr.message;
1452 }
1453
1454
1455
1456 /*************************************************
1457 *           Copy error to toplevel address       *
1458 *************************************************/
1459
1460 /* This function is used when a verify fails or defers, to ensure that the
1461 failure or defer information is in the original toplevel address. This applies
1462 when an address is redirected to a single new address, and the failure or
1463 deferral happens to the child address.
1464
1465 Arguments:
1466   vaddr       the verify address item
1467   addr        the final address item
1468   yield       FAIL or DEFER
1469
1470 Returns:      the value of YIELD
1471 */
1472
1473 static int
1474 copy_error(address_item *vaddr, address_item *addr, int yield)
1475 {
1476 if (addr != vaddr)
1477   {
1478   vaddr->message = addr->message;
1479   vaddr->user_message = addr->user_message;
1480   vaddr->basic_errno = addr->basic_errno;
1481   vaddr->more_errno = addr->more_errno;
1482   vaddr->prop.address_data = addr->prop.address_data;
1483   copyflag(vaddr, addr, af_pass_message);
1484   }
1485 return yield;
1486 }
1487
1488
1489
1490
1491 /**************************************************
1492 * printf that automatically handles TLS if needed *
1493 ***************************************************/
1494
1495 /* This function is used by verify_address() as a substitute for all fprintf()
1496 calls; a direct fprintf() will not produce output in a TLS SMTP session, such
1497 as a response to an EXPN command.  smtp_in.c makes smtp_printf available but
1498 that assumes that we always use the smtp_out FILE* when not using TLS or the
1499 ssl buffer when we are.  Instead we take a FILE* parameter and check to see if
1500 that is smtp_out; if so, smtp_printf() with TLS support, otherwise regular
1501 fprintf().
1502
1503 Arguments:
1504   f           the candidate FILE* to write to
1505   format      format string
1506   ...         optional arguments
1507
1508 Returns:
1509               nothing
1510 */
1511
1512 static void PRINTF_FUNCTION(2,3)
1513 respond_printf(FILE *f, const char *format, ...)
1514 {
1515 va_list ap;
1516
1517 va_start(ap, format);
1518 if (smtp_out && (f == smtp_out))
1519   smtp_vprintf(format, ap);
1520 else
1521   vfprintf(f, format, ap);
1522 va_end(ap);
1523 }
1524
1525
1526
1527 /*************************************************
1528 *            Verify an email address             *
1529 *************************************************/
1530
1531 /* This function is used both for verification (-bv and at other times) and
1532 address testing (-bt), which is indicated by address_test_mode being set.
1533
1534 Arguments:
1535   vaddr            contains the address to verify; the next field in this block
1536                      must be NULL
1537   f                if not NULL, write the result to this file
1538   options          various option bits:
1539                      vopt_fake_sender => this sender verify is not for the real
1540                        sender (it was verify=sender=xxxx or an address from a
1541                        header line) - rewriting must not change sender_address
1542                      vopt_is_recipient => this is a recipient address, otherwise
1543                        it's a sender address - this affects qualification and
1544                        rewriting and messages from callouts
1545                      vopt_qualify => qualify an unqualified address; else error
1546                      vopt_expn => called from SMTP EXPN command
1547                      vopt_success_on_redirect => when a new address is generated
1548                        the verification instantly succeeds
1549
1550                      These ones are used by do_callout() -- the options variable
1551                        is passed to it.
1552
1553                      vopt_callout_fullpm => if postmaster check, do full one
1554                      vopt_callout_no_cache => don't use callout cache
1555                      vopt_callout_random => do the "random" thing
1556                      vopt_callout_recipsender => use real sender for recipient
1557                      vopt_callout_recippmaster => use postmaster for recipient
1558
1559   callout          if > 0, specifies that callout is required, and gives timeout
1560                      for individual commands
1561   callout_overall  if > 0, gives overall timeout for the callout function;
1562                    if < 0, a default is used (see do_callout())
1563   callout_connect  the connection timeout for callouts
1564   se_mailfrom      when callout is requested to verify a sender, use this
1565                      in MAIL FROM; NULL => ""
1566   pm_mailfrom      when callout is requested, if non-NULL, do the postmaster
1567                      thing and use this as the sender address (may be "")
1568
1569   routed           if not NULL, set TRUE if routing succeeded, so we can
1570                      distinguish between routing failed and callout failed
1571
1572 Returns:           OK      address verified
1573                    FAIL    address failed to verify
1574                    DEFER   can't tell at present
1575 */
1576
1577 int
1578 verify_address(address_item *vaddr, FILE *f, int options, int callout,
1579   int callout_overall, int callout_connect, uschar *se_mailfrom,
1580   uschar *pm_mailfrom, BOOL *routed)
1581 {
1582 BOOL allok = TRUE;
1583 BOOL full_info = (f == NULL)? FALSE : (debug_selector != 0);
1584 BOOL expn         = (options & vopt_expn) != 0;
1585 BOOL success_on_redirect = (options & vopt_success_on_redirect) != 0;
1586 int i;
1587 int yield = OK;
1588 int verify_type = expn? v_expn :
1589      address_test_mode? v_none :
1590           options & vopt_is_recipient? v_recipient : v_sender;
1591 address_item *addr_list;
1592 address_item *addr_new = NULL;
1593 address_item *addr_remote = NULL;
1594 address_item *addr_local = NULL;
1595 address_item *addr_succeed = NULL;
1596 uschar **failure_ptr = options & vopt_is_recipient
1597   ? &recipient_verify_failure : &sender_verify_failure;
1598 uschar *ko_prefix, *cr;
1599 uschar *address = vaddr->address;
1600 uschar *save_sender;
1601 uschar null_sender[] = { 0 };             /* Ensure writeable memory */
1602
1603 /* Clear, just in case */
1604
1605 *failure_ptr = NULL;
1606
1607 /* Set up a prefix and suffix for error message which allow us to use the same
1608 output statements both in EXPN mode (where an SMTP response is needed) and when
1609 debugging with an output file. */
1610
1611 if (expn)
1612   {
1613   ko_prefix = US"553 ";
1614   cr = US"\r";
1615   }
1616 else ko_prefix = cr = US"";
1617
1618 /* Add qualify domain if permitted; otherwise an unqualified address fails. */
1619
1620 if (parse_find_at(address) == NULL)
1621   {
1622   if ((options & vopt_qualify) == 0)
1623     {
1624     if (f != NULL)
1625       respond_printf(f, "%sA domain is required for \"%s\"%s\n",
1626         ko_prefix, address, cr);
1627     *failure_ptr = US"qualify";
1628     return FAIL;
1629     }
1630   address = rewrite_address_qualify(address, options & vopt_is_recipient);
1631   }
1632
1633 DEBUG(D_verify)
1634   {
1635   debug_printf(">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>\n");
1636   debug_printf("%s %s\n", address_test_mode? "Testing" : "Verifying", address);
1637   }
1638
1639 /* Rewrite and report on it. Clear the domain and local part caches - these
1640 may have been set by domains and local part tests during an ACL. */
1641
1642 if (global_rewrite_rules != NULL)
1643   {
1644   uschar *old = address;
1645   address = rewrite_address(address, options & vopt_is_recipient, FALSE,
1646     global_rewrite_rules, rewrite_existflags);
1647   if (address != old)
1648     {
1649     for (i = 0; i < (MAX_NAMED_LIST * 2)/32; i++) vaddr->localpart_cache[i] = 0;
1650     for (i = 0; i < (MAX_NAMED_LIST * 2)/32; i++) vaddr->domain_cache[i] = 0;
1651     if (f != NULL && !expn) fprintf(f, "Address rewritten as: %s\n", address);
1652     }
1653   }
1654
1655 /* If this is the real sender address, we must update sender_address at
1656 this point, because it may be referred to in the routers. */
1657
1658 if ((options & (vopt_fake_sender|vopt_is_recipient)) == 0)
1659   sender_address = address;
1660
1661 /* If the address was rewritten to <> no verification can be done, and we have
1662 to return OK. This rewriting is permitted only for sender addresses; for other
1663 addresses, such rewriting fails. */
1664
1665 if (address[0] == 0) return OK;
1666
1667 /* Flip the legacy TLS-related variables over to the outbound set in case
1668 they're used in the context of a transport used by verification. Reset them
1669 at exit from this routine (so no returns allowed from here on). */
1670
1671 tls_modify_variables(&tls_out);
1672
1673 /* Save a copy of the sender address for re-instating if we change it to <>
1674 while verifying a sender address (a nice bit of self-reference there). */
1675
1676 save_sender = sender_address;
1677
1678 /* Observability variable for router/transport use */
1679
1680 verify_mode = options & vopt_is_recipient ? US"R" : US"S";
1681
1682 /* Update the address structure with the possibly qualified and rewritten
1683 address. Set it up as the starting address on the chain of new addresses. */
1684
1685 vaddr->address = address;
1686 addr_new = vaddr;
1687
1688 /* We need a loop, because an address can generate new addresses. We must also
1689 cope with generated pipes and files at the top level. (See also the code and
1690 comment in deliver.c.) However, it is usually the case that the router for
1691 user's .forward files has its verify flag turned off.
1692
1693 If an address generates more than one child, the loop is used only when
1694 full_info is set, and this can only be set locally. Remote enquiries just get
1695 information about the top level address, not anything that it generated. */
1696
1697 while (addr_new)
1698   {
1699   int rc;
1700   address_item *addr = addr_new;
1701
1702   addr_new = addr->next;
1703   addr->next = NULL;
1704
1705   DEBUG(D_verify)
1706     {
1707     debug_printf(">>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>\n");
1708     debug_printf("Considering %s\n", addr->address);
1709     }
1710
1711   /* Handle generated pipe, file or reply addresses. We don't get these
1712   when handling EXPN, as it does only one level of expansion. */
1713
1714   if (testflag(addr, af_pfr))
1715     {
1716     allok = FALSE;
1717     if (f != NULL)
1718       {
1719       BOOL allow;
1720
1721       if (addr->address[0] == '>')
1722         {
1723         allow = testflag(addr, af_allow_reply);
1724         fprintf(f, "%s -> mail %s", addr->parent->address, addr->address + 1);
1725         }
1726       else
1727         {
1728         allow = (addr->address[0] == '|')?
1729           testflag(addr, af_allow_pipe) : testflag(addr, af_allow_file);
1730         fprintf(f, "%s -> %s", addr->parent->address, addr->address);
1731         }
1732
1733       if (addr->basic_errno == ERRNO_BADTRANSPORT)
1734         fprintf(f, "\n*** Error in setting up pipe, file, or autoreply:\n"
1735           "%s\n", addr->message);
1736       else if (allow)
1737         fprintf(f, "\n  transport = %s\n", addr->transport->name);
1738       else
1739         fprintf(f, " *** forbidden ***\n");
1740       }
1741     continue;
1742     }
1743
1744   /* Just in case some router parameter refers to it. */
1745
1746   return_path = addr->prop.errors_address
1747     ? addr->prop.errors_address : sender_address;
1748
1749   /* Split the address into domain and local part, handling the %-hack if
1750   necessary, and then route it. While routing a sender address, set
1751   $sender_address to <> because that is what it will be if we were trying to
1752   send a bounce to the sender. */
1753
1754   if (routed) *routed = FALSE;
1755   if ((rc = deliver_split_address(addr)) == OK)
1756     {
1757     if (!(options & vopt_is_recipient)) sender_address = null_sender;
1758     rc = route_address(addr, &addr_local, &addr_remote, &addr_new,
1759       &addr_succeed, verify_type);
1760     sender_address = save_sender;     /* Put back the real sender */
1761     }
1762
1763   /* If routing an address succeeded, set the flag that remembers, for use when
1764   an ACL cached a sender verify (in case a callout fails). Then if routing set
1765   up a list of hosts or the transport has a host list, and the callout option
1766   is set, and we aren't in a host checking run, do the callout verification,
1767   and set another flag that notes that a callout happened. */
1768
1769   if (rc == OK)
1770     {
1771     if (routed) *routed = TRUE;
1772     if (callout > 0)
1773       {
1774       transport_instance * tp;
1775       host_item * host_list = addr->host_list;
1776
1777       /* Make up some data for use in the case where there is no remote
1778       transport. */
1779
1780       transport_feedback tf = {
1781         NULL,                       /* interface (=> any) */
1782         US"smtp",                   /* port */
1783         US"smtp",                   /* protocol */
1784         NULL,                       /* hosts */
1785         US"$smtp_active_hostname",  /* helo_data */
1786         FALSE,                      /* hosts_override */
1787         FALSE,                      /* hosts_randomize */
1788         FALSE,                      /* gethostbyname */
1789         TRUE,                       /* qualify_single */
1790         FALSE                       /* search_parents */
1791         };
1792
1793       /* If verification yielded a remote transport, we want to use that
1794       transport's options, so as to mimic what would happen if we were really
1795       sending a message to this address. */
1796
1797       if ((tp = addr->transport) && !tp->info->local)
1798         {
1799         (void)(tp->setup)(tp, addr, &tf, 0, 0, NULL);
1800
1801         /* If the transport has hosts and the router does not, or if the
1802         transport is configured to override the router's hosts, we must build a
1803         host list of the transport's hosts, and find the IP addresses */
1804
1805         if (tf.hosts && (!host_list || tf.hosts_override))
1806           {
1807           uschar *s;
1808           const uschar *save_deliver_domain = deliver_domain;
1809           uschar *save_deliver_localpart = deliver_localpart;
1810
1811           host_list = NULL;    /* Ignore the router's hosts */
1812
1813           deliver_domain = addr->domain;
1814           deliver_localpart = addr->local_part;
1815           s = expand_string(tf.hosts);
1816           deliver_domain = save_deliver_domain;
1817           deliver_localpart = save_deliver_localpart;
1818
1819           if (!s)
1820             {
1821             log_write(0, LOG_MAIN|LOG_PANIC, "failed to expand list of hosts "
1822               "\"%s\" in %s transport for callout: %s", tf.hosts,
1823               tp->name, expand_string_message);
1824             }
1825           else
1826             {
1827             int flags;
1828             host_item *host, *nexthost;
1829             host_build_hostlist(&host_list, s, tf.hosts_randomize);
1830
1831             /* Just ignore failures to find a host address. If we don't manage
1832             to find any addresses, the callout will defer. Note that more than
1833             one address may be found for a single host, which will result in
1834             additional host items being inserted into the chain. Hence we must
1835             save the next host first. */
1836
1837             flags = HOST_FIND_BY_A;
1838             if (tf.qualify_single) flags |= HOST_FIND_QUALIFY_SINGLE;
1839             if (tf.search_parents) flags |= HOST_FIND_SEARCH_PARENTS;
1840
1841             for (host = host_list; host; host = nexthost)
1842               {
1843               nexthost = host->next;
1844               if (tf.gethostbyname ||
1845                   string_is_ip_address(host->name, NULL) != 0)
1846                 (void)host_find_byname(host, NULL, flags, NULL, TRUE);
1847               else
1848                 {
1849                 dnssec_domains * dnssec_domains = NULL;
1850                 if (Ustrcmp(tp->driver_name, "smtp") == 0)
1851                   {
1852                   smtp_transport_options_block * ob =
1853                       (smtp_transport_options_block *) tp->options_block;
1854                   dnssec_domains = &ob->dnssec;
1855                   }
1856
1857                 (void) host_find_bydns(host, NULL, flags, NULL, NULL, NULL,
1858                   dnssec_domains, NULL, NULL);
1859                 }
1860               }
1861             }
1862           }
1863         }
1864
1865       /* Can only do a callout if we have at least one host! If the callout
1866       fails, it will have set ${sender,recipient}_verify_failure. */
1867
1868       if (host_list)
1869         {
1870         HDEBUG(D_verify) debug_printf("Attempting full verification using callout\n");
1871         if (host_checking && !host_checking_callout)
1872           {
1873           HDEBUG(D_verify)
1874             debug_printf("... callout omitted by default when host testing\n"
1875               "(Use -bhc if you want the callouts to happen.)\n");
1876           }
1877         else
1878           {
1879 #ifdef SUPPORT_TLS
1880           deliver_set_expansions(addr);
1881 #endif
1882           rc = do_callout(addr, host_list, &tf, callout, callout_overall,
1883             callout_connect, options, se_mailfrom, pm_mailfrom);
1884           }
1885         }
1886       else
1887         {
1888         HDEBUG(D_verify) debug_printf("Cannot do callout: neither router nor "
1889           "transport provided a host list\n");
1890         }
1891       }
1892     }
1893
1894   /* Otherwise, any failure is a routing failure */
1895
1896   else *failure_ptr = US"route";
1897
1898   /* A router may return REROUTED if it has set up a child address as a result
1899   of a change of domain name (typically from widening). In this case we always
1900   want to continue to verify the new child. */
1901
1902   if (rc == REROUTED) continue;
1903
1904   /* Handle hard failures */
1905
1906   if (rc == FAIL)
1907     {
1908     allok = FALSE;
1909     if (f)
1910       {
1911       address_item *p = addr->parent;
1912
1913       respond_printf(f, "%s%s %s", ko_prefix,
1914         full_info ? addr->address : address,
1915         address_test_mode ? "is undeliverable" : "failed to verify");
1916       if (!expn && admin_user)
1917         {
1918         if (addr->basic_errno > 0)
1919           respond_printf(f, ": %s", strerror(addr->basic_errno));
1920         if (addr->message)
1921           respond_printf(f, ": %s", addr->message);
1922         }
1923
1924       /* Show parents iff doing full info */
1925
1926       if (full_info) while (p)
1927         {
1928         respond_printf(f, "%s\n    <-- %s", cr, p->address);
1929         p = p->parent;
1930         }
1931       respond_printf(f, "%s\n", cr);
1932       }
1933     cancel_cutthrough_connection(TRUE, US"routing hard fail");
1934
1935     if (!full_info)
1936       {
1937       yield = copy_error(vaddr, addr, FAIL);
1938       goto out;
1939       }
1940     yield = FAIL;
1941     }
1942
1943   /* Soft failure */
1944
1945   else if (rc == DEFER)
1946     {
1947     allok = FALSE;
1948     if (f)
1949       {
1950       address_item *p = addr->parent;
1951       respond_printf(f, "%s%s cannot be resolved at this time", ko_prefix,
1952         full_info? addr->address : address);
1953       if (!expn && admin_user)
1954         {
1955         if (addr->basic_errno > 0)
1956           respond_printf(f, ": %s", strerror(addr->basic_errno));
1957         if (addr->message)
1958           respond_printf(f, ": %s", addr->message);
1959         else if (addr->basic_errno <= 0)
1960           respond_printf(f, ": unknown error");
1961         }
1962
1963       /* Show parents iff doing full info */
1964
1965       if (full_info) while (p)
1966         {
1967         respond_printf(f, "%s\n    <-- %s", cr, p->address);
1968         p = p->parent;
1969         }
1970       respond_printf(f, "%s\n", cr);
1971       }
1972     cancel_cutthrough_connection(TRUE, US"routing soft fail");
1973
1974     if (!full_info)
1975       {
1976       yield = copy_error(vaddr, addr, DEFER);
1977       goto out;
1978       }
1979     if (yield == OK) yield = DEFER;
1980     }
1981
1982   /* If we are handling EXPN, we do not want to continue to route beyond
1983   the top level (whose address is in "address"). */
1984
1985   else if (expn)
1986     {
1987     uschar *ok_prefix = US"250-";
1988
1989     if (!addr_new)
1990       if (!addr_local && !addr_remote)
1991         respond_printf(f, "250 mail to <%s> is discarded\r\n", address);
1992       else
1993         respond_printf(f, "250 <%s>\r\n", address);
1994
1995     else do
1996       {
1997       address_item *addr2 = addr_new;
1998       addr_new = addr2->next;
1999       if (!addr_new) ok_prefix = US"250 ";
2000       respond_printf(f, "%s<%s>\r\n", ok_prefix, addr2->address);
2001       } while (addr_new);
2002     yield = OK;
2003     goto out;
2004     }
2005
2006   /* Successful routing other than EXPN. */
2007
2008   else
2009     {
2010     /* Handle successful routing when short info wanted. Otherwise continue for
2011     other (generated) addresses. Short info is the operational case. Full info
2012     can be requested only when debug_selector != 0 and a file is supplied.
2013
2014     There is a conflict between the use of aliasing as an alternate email
2015     address, and as a sort of mailing list. If an alias turns the incoming
2016     address into just one address (e.g. J.Caesar->jc44) you may well want to
2017     carry on verifying the generated address to ensure it is valid when
2018     checking incoming mail. If aliasing generates multiple addresses, you
2019     probably don't want to do this. Exim therefore treats the generation of
2020     just a single new address as a special case, and continues on to verify the
2021     generated address. */
2022
2023     if (  !full_info                    /* Stop if short info wanted AND */
2024        && (  (  !addr_new               /* No new address OR */
2025              || addr_new->next          /* More than one new address OR */
2026              || testflag(addr_new, af_pfr)      /* New address is pfr */
2027              )
2028           ||                            /* OR */
2029              (  addr_new                /* At least one new address AND */
2030              && success_on_redirect     /* success_on_redirect is set */
2031           )  )
2032        )
2033       {
2034       if (f) fprintf(f, "%s %s\n",
2035         address, address_test_mode ? "is deliverable" : "verified");
2036
2037       /* If we have carried on to verify a child address, we want the value
2038       of $address_data to be that of the child */
2039
2040       vaddr->prop.address_data = addr->prop.address_data;
2041
2042       /* If stopped because more than one new address, cannot cutthrough */
2043
2044       if (addr_new && addr_new->next)
2045         cancel_cutthrough_connection(TRUE, US"multiple addresses from routing");
2046
2047       yield = OK;
2048       goto out;
2049       }
2050     }
2051   }     /* Loop for generated addresses */
2052
2053 /* Display the full results of the successful routing, including any generated
2054 addresses. Control gets here only when full_info is set, which requires f not
2055 to be NULL, and this occurs only when a top-level verify is called with the
2056 debugging switch on.
2057
2058 If there are no local and no remote addresses, and there were no pipes, files,
2059 or autoreplies, and there were no errors or deferments, the message is to be
2060 discarded, usually because of the use of :blackhole: in an alias file. */
2061
2062 if (allok && !addr_local && !addr_remote)
2063   {
2064   fprintf(f, "mail to %s is discarded\n", address);
2065   goto out;
2066   }
2067
2068 for (addr_list = addr_local, i = 0; i < 2; addr_list = addr_remote, i++)
2069   while (addr_list)
2070     {
2071     address_item *addr = addr_list;
2072     address_item *p = addr->parent;
2073     transport_instance * tp = addr->transport;
2074
2075     addr_list = addr->next;
2076
2077     fprintf(f, "%s", CS addr->address);
2078 #ifdef EXPERIMENTAL_SRS
2079     if(addr->prop.srs_sender)
2080       fprintf(f, "    [srs = %s]", addr->prop.srs_sender);
2081 #endif
2082
2083     /* If the address is a duplicate, show something about it. */
2084
2085     if (!testflag(addr, af_pfr))
2086       {
2087       tree_node *tnode;
2088       if ((tnode = tree_search(tree_duplicates, addr->unique)))
2089         fprintf(f, "   [duplicate, would not be delivered]");
2090       else tree_add_duplicate(addr->unique, addr);
2091       }
2092
2093     /* Now show its parents */
2094
2095     for (p = addr->parent; p; p = p->parent)
2096       fprintf(f, "\n    <-- %s", p->address);
2097     fprintf(f, "\n  ");
2098
2099     /* Show router, and transport */
2100
2101     fprintf(f, "router = %s, transport = %s\n",
2102       addr->router->name, tp ? tp->name : US"unset");
2103
2104     /* Show any hosts that are set up by a router unless the transport
2105     is going to override them; fiddle a bit to get a nice format. */
2106
2107     if (addr->host_list && tp && !tp->overrides_hosts)
2108       {
2109       host_item *h;
2110       int maxlen = 0;
2111       int maxaddlen = 0;
2112       for (h = addr->host_list; h; h = h->next)
2113         {                               /* get max lengths of host names, addrs */
2114         int len = Ustrlen(h->name);
2115         if (len > maxlen) maxlen = len;
2116         len = h->address ? Ustrlen(h->address) : 7;
2117         if (len > maxaddlen) maxaddlen = len;
2118         }
2119       for (h = addr->host_list; h; h = h->next)
2120         {
2121         fprintf(f, "  host %-*s ", maxlen, h->name);
2122
2123         if (h->address)
2124           fprintf(f, "[%s%-*c", h->address, maxaddlen+1 - Ustrlen(h->address), ']');
2125         else if (tp->info->local)
2126           fprintf(f, " %-*s ", maxaddlen, "");  /* Omit [unknown] for local */
2127         else
2128           fprintf(f, "[%s%-*c", "unknown", maxaddlen+1 - 7, ']');
2129
2130         if (h->mx >= 0) fprintf(f, " MX=%d", h->mx);
2131         if (h->port != PORT_NONE) fprintf(f, " port=%d", h->port);
2132         if (running_in_test_harness  &&  h->dnssec == DS_YES) fputs(" AD", f);
2133         if (h->status == hstatus_unusable) fputs(" ** unusable **", f);
2134         fputc('\n', f);
2135         }
2136       }
2137     }
2138
2139 /* Yield will be DEFER or FAIL if any one address has, only for full_info (which is
2140 the -bv or -bt case). */
2141
2142 out:
2143 verify_mode = NULL;
2144 tls_modify_variables(&tls_in);
2145
2146 return yield;
2147 }
2148
2149
2150
2151
2152 /*************************************************
2153 *      Check headers for syntax errors           *
2154 *************************************************/
2155
2156 /* This function checks those header lines that contain addresses, and verifies
2157 that all the addresses therein are syntactially correct.
2158
2159 Arguments:
2160   msgptr     where to put an error message
2161
2162 Returns:     OK
2163              FAIL
2164 */
2165
2166 int
2167 verify_check_headers(uschar **msgptr)
2168 {
2169 header_line *h;
2170 uschar *colon, *s;
2171 int yield = OK;
2172
2173 for (h = header_list; h != NULL && yield == OK; h = h->next)
2174   {
2175   if (h->type != htype_from &&
2176       h->type != htype_reply_to &&
2177       h->type != htype_sender &&
2178       h->type != htype_to &&
2179       h->type != htype_cc &&
2180       h->type != htype_bcc)
2181     continue;
2182
2183   colon = Ustrchr(h->text, ':');
2184   s = colon + 1;
2185   while (isspace(*s)) s++;
2186
2187   /* Loop for multiple addresses in the header, enabling group syntax. Note
2188   that we have to reset this after the header has been scanned. */
2189
2190   parse_allow_group = TRUE;
2191
2192   while (*s != 0)
2193     {
2194     uschar *ss = parse_find_address_end(s, FALSE);
2195     uschar *recipient, *errmess;
2196     int terminator = *ss;
2197     int start, end, domain;
2198
2199     /* Temporarily terminate the string at this point, and extract the
2200     operative address within, allowing group syntax. */
2201
2202     *ss = 0;
2203     recipient = parse_extract_address(s,&errmess,&start,&end,&domain,FALSE);
2204     *ss = terminator;
2205
2206     /* Permit an unqualified address only if the message is local, or if the
2207     sending host is configured to be permitted to send them. */
2208
2209     if (recipient != NULL && domain == 0)
2210       {
2211       if (h->type == htype_from || h->type == htype_sender)
2212         {
2213         if (!allow_unqualified_sender) recipient = NULL;
2214         }
2215       else
2216         {
2217         if (!allow_unqualified_recipient) recipient = NULL;
2218         }
2219       if (recipient == NULL) errmess = US"unqualified address not permitted";
2220       }
2221
2222     /* It's an error if no address could be extracted, except for the special
2223     case of an empty address. */
2224
2225     if (recipient == NULL && Ustrcmp(errmess, "empty address") != 0)
2226       {
2227       uschar *verb = US"is";
2228       uschar *t = ss;
2229       uschar *tt = colon;
2230       int len;
2231
2232       /* Arrange not to include any white space at the end in the
2233       error message or the header name. */
2234
2235       while (t > s && isspace(t[-1])) t--;
2236       while (tt > h->text && isspace(tt[-1])) tt--;
2237
2238       /* Add the address that failed to the error message, since in a
2239       header with very many addresses it is sometimes hard to spot
2240       which one is at fault. However, limit the amount of address to
2241       quote - cases have been seen where, for example, a missing double
2242       quote in a humungous To: header creates an "address" that is longer
2243       than string_sprintf can handle. */
2244
2245       len = t - s;
2246       if (len > 1024)
2247         {
2248         len = 1024;
2249         verb = US"begins";
2250         }
2251
2252       /* deconst cast ok as we're passing a non-const to string_printing() */
2253       *msgptr = US string_printing(
2254         string_sprintf("%s: failing address in \"%.*s:\" header %s: %.*s",
2255           errmess, tt - h->text, h->text, verb, len, s));
2256
2257       yield = FAIL;
2258       break;          /* Out of address loop */
2259       }
2260
2261     /* Advance to the next address */
2262
2263     s = ss + (terminator? 1:0);
2264     while (isspace(*s)) s++;
2265     }   /* Next address */
2266
2267   parse_allow_group = FALSE;
2268   parse_found_group = FALSE;
2269   }     /* Next header unless yield has been set FALSE */
2270
2271 return yield;
2272 }
2273
2274
2275 /*************************************************
2276 *      Check header names for 8-bit characters   *
2277 *************************************************/
2278
2279 /* This function checks for invalid characters in header names. See
2280 RFC 5322, 2.2. and RFC 6532, 3.
2281
2282 Arguments:
2283   msgptr     where to put an error message
2284
2285 Returns:     OK
2286              FAIL
2287 */
2288
2289 int
2290 verify_check_header_names_ascii(uschar **msgptr)
2291 {
2292 header_line *h;
2293 uschar *colon, *s;
2294
2295 for (h = header_list; h; h = h->next)
2296   {
2297   colon = Ustrchr(h->text, ':');
2298   for(s = h->text; s < colon; s++)
2299     if ((*s < 33) || (*s > 126))
2300       {
2301       *msgptr = string_sprintf("Invalid character in header \"%.*s\" found",
2302                              colon - h->text, h->text);
2303       return FAIL;
2304       }
2305   }
2306 return OK;
2307 }
2308
2309 /*************************************************
2310 *          Check for blind recipients            *
2311 *************************************************/
2312
2313 /* This function checks that every (envelope) recipient is mentioned in either
2314 the To: or Cc: header lines, thus detecting blind carbon copies.
2315
2316 There are two ways of scanning that could be used: either scan the header lines
2317 and tick off the recipients, or scan the recipients and check the header lines.
2318 The original proposed patch did the former, but I have chosen to do the latter,
2319 because (a) it requires no memory and (b) will use fewer resources when there
2320 are many addresses in To: and/or Cc: and only one or two envelope recipients.
2321
2322 Arguments:   none
2323 Returns:     OK    if there are no blind recipients
2324              FAIL  if there is at least one blind recipient
2325 */
2326
2327 int
2328 verify_check_notblind(void)
2329 {
2330 int i;
2331 for (i = 0; i < recipients_count; i++)
2332   {
2333   header_line *h;
2334   BOOL found = FALSE;
2335   uschar *address = recipients_list[i].address;
2336
2337   for (h = header_list; !found && h != NULL; h = h->next)
2338     {
2339     uschar *colon, *s;
2340
2341     if (h->type != htype_to && h->type != htype_cc) continue;
2342
2343     colon = Ustrchr(h->text, ':');
2344     s = colon + 1;
2345     while (isspace(*s)) s++;
2346
2347     /* Loop for multiple addresses in the header, enabling group syntax. Note
2348     that we have to reset this after the header has been scanned. */
2349
2350     parse_allow_group = TRUE;
2351
2352     while (*s != 0)
2353       {
2354       uschar *ss = parse_find_address_end(s, FALSE);
2355       uschar *recipient,*errmess;
2356       int terminator = *ss;
2357       int start, end, domain;
2358
2359       /* Temporarily terminate the string at this point, and extract the
2360       operative address within, allowing group syntax. */
2361
2362       *ss = 0;
2363       recipient = parse_extract_address(s,&errmess,&start,&end,&domain,FALSE);
2364       *ss = terminator;
2365
2366       /* If we found a valid recipient that has a domain, compare it with the
2367       envelope recipient. Local parts are compared case-sensitively, domains
2368       case-insensitively. By comparing from the start with length "domain", we
2369       include the "@" at the end, which ensures that we are comparing the whole
2370       local part of each address. */
2371
2372       if (recipient != NULL && domain != 0)
2373         {
2374         found = Ustrncmp(recipient, address, domain) == 0 &&
2375                 strcmpic(recipient + domain, address + domain) == 0;
2376         if (found) break;
2377         }
2378
2379       /* Advance to the next address */
2380
2381       s = ss + (terminator? 1:0);
2382       while (isspace(*s)) s++;
2383       }   /* Next address */
2384
2385     parse_allow_group = FALSE;
2386     parse_found_group = FALSE;
2387     }     /* Next header (if found is false) */
2388
2389   if (!found) return FAIL;
2390   }       /* Next recipient */
2391
2392 return OK;
2393 }
2394
2395
2396
2397 /*************************************************
2398 *          Find if verified sender               *
2399 *************************************************/
2400
2401 /* Usually, just a single address is verified as the sender of the message.
2402 However, Exim can be made to verify other addresses as well (often related in
2403 some way), and this is useful in some environments. There may therefore be a
2404 chain of such addresses that have previously been tested. This function finds
2405 whether a given address is on the chain.
2406
2407 Arguments:   the address to be verified
2408 Returns:     pointer to an address item, or NULL
2409 */
2410
2411 address_item *
2412 verify_checked_sender(uschar *sender)
2413 {
2414 address_item *addr;
2415 for (addr = sender_verified_list; addr != NULL; addr = addr->next)
2416   if (Ustrcmp(sender, addr->address) == 0) break;
2417 return addr;
2418 }
2419
2420
2421
2422
2423
2424 /*************************************************
2425 *             Get valid header address           *
2426 *************************************************/
2427
2428 /* Scan the originator headers of the message, looking for an address that
2429 verifies successfully. RFC 822 says:
2430
2431     o   The "Sender" field mailbox should be sent  notices  of
2432         any  problems in transport or delivery of the original
2433         messages.  If there is no  "Sender"  field,  then  the
2434         "From" field mailbox should be used.
2435
2436     o   If the "Reply-To" field exists, then the reply  should
2437         go to the addresses indicated in that field and not to
2438         the address(es) indicated in the "From" field.
2439
2440 So we check a Sender field if there is one, else a Reply_to field, else a From
2441 field. As some strange messages may have more than one of these fields,
2442 especially if they are resent- fields, check all of them if there is more than
2443 one.
2444
2445 Arguments:
2446   user_msgptr      points to where to put a user error message
2447   log_msgptr       points to where to put a log error message
2448   callout          timeout for callout check (passed to verify_address())
2449   callout_overall  overall callout timeout (ditto)
2450   callout_connect  connect callout timeout (ditto)
2451   se_mailfrom      mailfrom for verify; NULL => ""
2452   pm_mailfrom      sender for pm callout check (passed to verify_address())
2453   options          callout options (passed to verify_address())
2454   verrno           where to put the address basic_errno
2455
2456 If log_msgptr is set to something without setting user_msgptr, the caller
2457 normally uses log_msgptr for both things.
2458
2459 Returns:           result of the verification attempt: OK, FAIL, or DEFER;
2460                    FAIL is given if no appropriate headers are found
2461 */
2462
2463 int
2464 verify_check_header_address(uschar **user_msgptr, uschar **log_msgptr,
2465   int callout, int callout_overall, int callout_connect, uschar *se_mailfrom,
2466   uschar *pm_mailfrom, int options, int *verrno)
2467 {
2468 static int header_types[] = { htype_sender, htype_reply_to, htype_from };
2469 BOOL done = FALSE;
2470 int yield = FAIL;
2471 int i;
2472
2473 for (i = 0; i < 3 && !done; i++)
2474   {
2475   header_line *h;
2476   for (h = header_list; h != NULL && !done; h = h->next)
2477     {
2478     int terminator, new_ok;
2479     uschar *s, *ss, *endname;
2480
2481     if (h->type != header_types[i]) continue;
2482     s = endname = Ustrchr(h->text, ':') + 1;
2483
2484     /* Scan the addresses in the header, enabling group syntax. Note that we
2485     have to reset this after the header has been scanned. */
2486
2487     parse_allow_group = TRUE;
2488
2489     while (*s != 0)
2490       {
2491       address_item *vaddr;
2492
2493       while (isspace(*s) || *s == ',') s++;
2494       if (*s == 0) break;        /* End of header */
2495
2496       ss = parse_find_address_end(s, FALSE);
2497
2498       /* The terminator is a comma or end of header, but there may be white
2499       space preceding it (including newline for the last address). Move back
2500       past any white space so we can check against any cached envelope sender
2501       address verifications. */
2502
2503       while (isspace(ss[-1])) ss--;
2504       terminator = *ss;
2505       *ss = 0;
2506
2507       HDEBUG(D_verify) debug_printf("verifying %.*s header address %s\n",
2508         (int)(endname - h->text), h->text, s);
2509
2510       /* See if we have already verified this address as an envelope sender,
2511       and if so, use the previous answer. */
2512
2513       vaddr = verify_checked_sender(s);
2514
2515       if (vaddr != NULL &&                   /* Previously checked */
2516            (callout <= 0 ||                  /* No callout needed; OR */
2517             vaddr->special_action > 256))    /* Callout was done */
2518         {
2519         new_ok = vaddr->special_action & 255;
2520         HDEBUG(D_verify) debug_printf("previously checked as envelope sender\n");
2521         *ss = terminator;  /* Restore shortened string */
2522         }
2523
2524       /* Otherwise we run the verification now. We must restore the shortened
2525       string before running the verification, so the headers are correct, in
2526       case there is any rewriting. */
2527
2528       else
2529         {
2530         int start, end, domain;
2531         uschar *address = parse_extract_address(s, log_msgptr, &start, &end,
2532           &domain, FALSE);
2533
2534         *ss = terminator;
2535
2536         /* If we found an empty address, just carry on with the next one, but
2537         kill the message. */
2538
2539         if (address == NULL && Ustrcmp(*log_msgptr, "empty address") == 0)
2540           {
2541           *log_msgptr = NULL;
2542           s = ss;
2543           continue;
2544           }
2545
2546         /* If verification failed because of a syntax error, fail this
2547         function, and ensure that the failing address gets added to the error
2548         message. */
2549
2550         if (address == NULL)
2551           {
2552           new_ok = FAIL;
2553           while (ss > s && isspace(ss[-1])) ss--;
2554           *log_msgptr = string_sprintf("syntax error in '%.*s' header when "
2555             "scanning for sender: %s in \"%.*s\"",
2556             endname - h->text, h->text, *log_msgptr, ss - s, s);
2557           yield = FAIL;
2558           done = TRUE;
2559           break;
2560           }
2561
2562         /* Else go ahead with the sender verification. But it isn't *the*
2563         sender of the message, so set vopt_fake_sender to stop sender_address
2564         being replaced after rewriting or qualification. */
2565
2566         else
2567           {
2568           vaddr = deliver_make_addr(address, FALSE);
2569           new_ok = verify_address(vaddr, NULL, options | vopt_fake_sender,
2570             callout, callout_overall, callout_connect, se_mailfrom,
2571             pm_mailfrom, NULL);
2572           }
2573         }
2574
2575       /* We now have the result, either newly found, or cached. If we are
2576       giving out error details, set a specific user error. This means that the
2577       last of these will be returned to the user if all three fail. We do not
2578       set a log message - the generic one below will be used. */
2579
2580       if (new_ok != OK)
2581         {
2582         *verrno = vaddr->basic_errno;
2583         if (smtp_return_error_details)
2584           {
2585           *user_msgptr = string_sprintf("Rejected after DATA: "
2586             "could not verify \"%.*s\" header address\n%s: %s",
2587             endname - h->text, h->text, vaddr->address, vaddr->message);
2588           }
2589         }
2590
2591       /* Success or defer */
2592
2593       if (new_ok == OK)
2594         {
2595         yield = OK;
2596         done = TRUE;
2597         break;
2598         }
2599
2600       if (new_ok == DEFER) yield = DEFER;
2601
2602       /* Move on to any more addresses in the header */
2603
2604       s = ss;
2605       }     /* Next address */
2606
2607     parse_allow_group = FALSE;
2608     parse_found_group = FALSE;
2609     }       /* Next header, unless done */
2610   }         /* Next header type unless done */
2611
2612 if (yield == FAIL && *log_msgptr == NULL)
2613   *log_msgptr = US"there is no valid sender in any header line";
2614
2615 if (yield == DEFER && *log_msgptr == NULL)
2616   *log_msgptr = US"all attempts to verify a sender in a header line deferred";
2617
2618 return yield;
2619 }
2620
2621
2622
2623
2624 /*************************************************
2625 *            Get RFC 1413 identification         *
2626 *************************************************/
2627
2628 /* Attempt to get an id from the sending machine via the RFC 1413 protocol. If
2629 the timeout is set to zero, then the query is not done. There may also be lists
2630 of hosts and nets which are exempt. To guard against malefactors sending
2631 non-printing characters which could, for example, disrupt a message's headers,
2632 make sure the string consists of printing characters only.
2633
2634 Argument:
2635   port    the port to connect to; usually this is IDENT_PORT (113), but when
2636           running in the test harness with -bh a different value is used.
2637
2638 Returns:  nothing
2639
2640 Side effect: any received ident value is put in sender_ident (NULL otherwise)
2641 */
2642
2643 void
2644 verify_get_ident(int port)
2645 {
2646 int sock, host_af, qlen;
2647 int received_sender_port, received_interface_port, n;
2648 uschar *p;
2649 uschar buffer[2048];
2650
2651 /* Default is no ident. Check whether we want to do an ident check for this
2652 host. */
2653
2654 sender_ident = NULL;
2655 if (rfc1413_query_timeout <= 0 || verify_check_host(&rfc1413_hosts) != OK)
2656   return;
2657
2658 DEBUG(D_ident) debug_printf("doing ident callback\n");
2659
2660 /* Set up a connection to the ident port of the remote host. Bind the local end
2661 to the incoming interface address. If the sender host address is an IPv6
2662 address, the incoming interface address will also be IPv6. */
2663
2664 host_af = Ustrchr(sender_host_address, ':') == NULL ? AF_INET : AF_INET6;
2665 if ((sock = ip_socket(SOCK_STREAM, host_af)) < 0) return;
2666
2667 if (ip_bind(sock, host_af, interface_address, 0) < 0)
2668   {
2669   DEBUG(D_ident) debug_printf("bind socket for ident failed: %s\n",
2670     strerror(errno));
2671   goto END_OFF;
2672   }
2673
2674 if (ip_connect(sock, host_af, sender_host_address, port,
2675                 rfc1413_query_timeout, TRUE) < 0)
2676   {
2677   if (errno == ETIMEDOUT && LOGGING(ident_timeout))
2678     log_write(0, LOG_MAIN, "ident connection to %s timed out",
2679       sender_host_address);
2680   else
2681     DEBUG(D_ident) debug_printf("ident connection to %s failed: %s\n",
2682       sender_host_address, strerror(errno));
2683   goto END_OFF;
2684   }
2685
2686 /* Construct and send the query. */
2687
2688 sprintf(CS buffer, "%d , %d\r\n", sender_host_port, interface_port);
2689 qlen = Ustrlen(buffer);
2690 if (send(sock, buffer, qlen, 0) < 0)
2691   {
2692   DEBUG(D_ident) debug_printf("ident send failed: %s\n", strerror(errno));
2693   goto END_OFF;
2694   }
2695
2696 /* Read a response line. We put it into the rest of the buffer, using several
2697 recv() calls if necessary. */
2698
2699 p = buffer + qlen;
2700
2701 for (;;)
2702   {
2703   uschar *pp;
2704   int count;
2705   int size = sizeof(buffer) - (p - buffer);
2706
2707   if (size <= 0) goto END_OFF;   /* Buffer filled without seeing \n. */
2708   count = ip_recv(sock, p, size, rfc1413_query_timeout);
2709   if (count <= 0) goto END_OFF;  /* Read error or EOF */
2710
2711   /* Scan what we just read, to see if we have reached the terminating \r\n. Be
2712   generous, and accept a plain \n terminator as well. The only illegal
2713   character is 0. */
2714
2715   for (pp = p; pp < p + count; pp++)
2716     {
2717     if (*pp == 0) goto END_OFF;   /* Zero octet not allowed */
2718     if (*pp == '\n')
2719       {
2720       if (pp[-1] == '\r') pp--;
2721       *pp = 0;
2722       goto GOT_DATA;             /* Break out of both loops */
2723       }
2724     }
2725
2726   /* Reached the end of the data without finding \n. Let the loop continue to
2727   read some more, if there is room. */
2728
2729   p = pp;
2730   }
2731
2732 GOT_DATA:
2733
2734 /* We have received a line of data. Check it carefully. It must start with the
2735 same two port numbers that we sent, followed by data as defined by the RFC. For
2736 example,
2737
2738   12345 , 25 : USERID : UNIX :root
2739
2740 However, the amount of white space may be different to what we sent. In the
2741 "osname" field there may be several sub-fields, comma separated. The data we
2742 actually want to save follows the third colon. Some systems put leading spaces
2743 in it - we discard those. */
2744
2745 if (sscanf(CS buffer + qlen, "%d , %d%n", &received_sender_port,
2746       &received_interface_port, &n) != 2 ||
2747     received_sender_port != sender_host_port ||
2748     received_interface_port != interface_port)
2749   goto END_OFF;
2750
2751 p = buffer + qlen + n;
2752 while(isspace(*p)) p++;
2753 if (*p++ != ':') goto END_OFF;
2754 while(isspace(*p)) p++;
2755 if (Ustrncmp(p, "USERID", 6) != 0) goto END_OFF;
2756 p += 6;
2757 while(isspace(*p)) p++;
2758 if (*p++ != ':') goto END_OFF;
2759 while (*p != 0 && *p != ':') p++;
2760 if (*p++ == 0) goto END_OFF;
2761 while(isspace(*p)) p++;
2762 if (*p == 0) goto END_OFF;
2763
2764 /* The rest of the line is the data we want. We turn it into printing
2765 characters when we save it, so that it cannot mess up the format of any logging
2766 or Received: lines into which it gets inserted. We keep a maximum of 127
2767 characters. The deconst cast is ok as we fed a nonconst to string_printing() */
2768
2769 sender_ident = US string_printing(string_copyn(p, 127));
2770 DEBUG(D_ident) debug_printf("sender_ident = %s\n", sender_ident);
2771
2772 END_OFF:
2773 (void)close(sock);
2774 return;
2775 }
2776
2777
2778
2779
2780 /*************************************************
2781 *      Match host to a single host-list item     *
2782 *************************************************/
2783
2784 /* This function compares a host (name or address) against a single item
2785 from a host list. The host name gets looked up if it is needed and is not
2786 already known. The function is called from verify_check_this_host() via
2787 match_check_list(), which is why most of its arguments are in a single block.
2788
2789 Arguments:
2790   arg            the argument block (see below)
2791   ss             the host-list item
2792   valueptr       where to pass back looked up data, or NULL
2793   error          for error message when returning ERROR
2794
2795 The block contains:
2796   host_name      (a) the host name, or
2797                  (b) NULL, implying use sender_host_name and
2798                        sender_host_aliases, looking them up if required, or
2799                  (c) the empty string, meaning that only IP address matches
2800                        are permitted
2801   host_address   the host address
2802   host_ipv4      the IPv4 address taken from an IPv6 one
2803
2804 Returns:         OK      matched
2805                  FAIL    did not match
2806                  DEFER   lookup deferred
2807                  ERROR   (a) failed to find the host name or IP address, or
2808                          (b) unknown lookup type specified, or
2809                          (c) host name encountered when only IP addresses are
2810                                being matched
2811 */
2812
2813 int
2814 check_host(void *arg, const uschar *ss, const uschar **valueptr, uschar **error)
2815 {
2816 check_host_block *cb = (check_host_block *)arg;
2817 int mlen = -1;
2818 int maskoffset;
2819 BOOL iplookup = FALSE;
2820 BOOL isquery = FALSE;
2821 BOOL isiponly = cb->host_name != NULL && cb->host_name[0] == 0;
2822 const uschar *t;
2823 uschar *semicolon;
2824 uschar **aliases;
2825
2826 /* Optimize for the special case when the pattern is "*". */
2827
2828 if (*ss == '*' && ss[1] == 0) return OK;
2829
2830 /* If the pattern is empty, it matches only in the case when there is no host -
2831 this can occur in ACL checking for SMTP input using the -bs option. In this
2832 situation, the host address is the empty string. */
2833
2834 if (cb->host_address[0] == 0) return (*ss == 0)? OK : FAIL;
2835 if (*ss == 0) return FAIL;
2836
2837 /* If the pattern is precisely "@" then match against the primary host name,
2838 provided that host name matching is permitted; if it's "@[]" match against the
2839 local host's IP addresses. */
2840
2841 if (*ss == '@')
2842   {
2843   if (ss[1] == 0)
2844     {
2845     if (isiponly) return ERROR;
2846     ss = primary_hostname;
2847     }
2848   else if (Ustrcmp(ss, "@[]") == 0)
2849     {
2850     ip_address_item *ip;
2851     for (ip = host_find_interfaces(); ip != NULL; ip = ip->next)
2852       if (Ustrcmp(ip->address, cb->host_address) == 0) return OK;
2853     return FAIL;
2854     }
2855   }
2856
2857 /* If the pattern is an IP address, optionally followed by a bitmask count, do
2858 a (possibly masked) comparison with the current IP address. */
2859
2860 if (string_is_ip_address(ss, &maskoffset) != 0)
2861   return (host_is_in_net(cb->host_address, ss, maskoffset)? OK : FAIL);
2862
2863 /* The pattern is not an IP address. A common error that people make is to omit
2864 one component of an IPv4 address, either by accident, or believing that, for
2865 example, 1.2.3/24 is the same as 1.2.3.0/24, or 1.2.3 is the same as 1.2.3.0,
2866 which it isn't. (Those applications that do accept 1.2.3 as an IP address
2867 interpret it as 1.2.0.3 because the final component becomes 16-bit - this is an
2868 ancient specification.) To aid in debugging these cases, we give a specific
2869 error if the pattern contains only digits and dots or contains a slash preceded
2870 only by digits and dots (a slash at the start indicates a file name and of
2871 course slashes may be present in lookups, but not preceded only by digits and
2872 dots). */
2873
2874 for (t = ss; isdigit(*t) || *t == '.'; t++);
2875 if (*t == 0 || (*t == '/' && t != ss))
2876   {
2877   *error = US"malformed IPv4 address or address mask";
2878   return ERROR;
2879   }
2880
2881 /* See if there is a semicolon in the pattern */
2882
2883 semicolon = Ustrchr(ss, ';');
2884
2885 /* If we are doing an IP address only match, then all lookups must be IP
2886 address lookups, even if there is no "net-". */
2887
2888 if (isiponly)
2889   {
2890   iplookup = semicolon != NULL;
2891   }
2892
2893 /* Otherwise, if the item is of the form net[n]-lookup;<file|query> then it is
2894 a lookup on a masked IP network, in textual form. We obey this code even if we
2895 have already set iplookup, so as to skip over the "net-" prefix and to set the
2896 mask length. The net- stuff really only applies to single-key lookups where the
2897 key is implicit. For query-style lookups the key is specified in the query.
2898 From release 4.30, the use of net- for query style is no longer needed, but we
2899 retain it for backward compatibility. */
2900
2901 if (Ustrncmp(ss, "net", 3) == 0 && semicolon != NULL)
2902   {
2903   mlen = 0;
2904   for (t = ss + 3; isdigit(*t); t++) mlen = mlen * 10 + *t - '0';
2905   if (mlen == 0 && t == ss+3) mlen = -1;  /* No mask supplied */
2906   iplookup = (*t++ == '-');
2907   }
2908 else t = ss;
2909
2910 /* Do the IP address lookup if that is indeed what we have */
2911
2912 if (iplookup)
2913   {
2914   int insize;
2915   int search_type;
2916   int incoming[4];
2917   void *handle;
2918   uschar *filename, *key, *result;
2919   uschar buffer[64];
2920
2921   /* Find the search type */
2922
2923   search_type = search_findtype(t, semicolon - t);
2924
2925   if (search_type < 0) log_write(0, LOG_MAIN|LOG_PANIC_DIE, "%s",
2926     search_error_message);
2927
2928   /* Adjust parameters for the type of lookup. For a query-style lookup, there
2929   is no file name, and the "key" is just the query. For query-style with a file
2930   name, we have to fish the file off the start of the query. For a single-key
2931   lookup, the key is the current IP address, masked appropriately, and
2932   reconverted to text form, with the mask appended. For IPv6 addresses, specify
2933   dot separators instead of colons, except when the lookup type is "iplsearch".
2934   */
2935
2936   if (mac_islookup(search_type, lookup_absfilequery))
2937     {
2938     filename = semicolon + 1;
2939     key = filename;
2940     while (*key != 0 && !isspace(*key)) key++;
2941     filename = string_copyn(filename, key - filename);
2942     while (isspace(*key)) key++;
2943     }
2944   else if (mac_islookup(search_type, lookup_querystyle))
2945     {
2946     filename = NULL;
2947     key = semicolon + 1;
2948     }
2949   else   /* Single-key style */
2950     {
2951     int sep = (Ustrcmp(lookup_list[search_type]->name, "iplsearch") == 0)?
2952       ':' : '.';
2953     insize = host_aton(cb->host_address, incoming);
2954     host_mask(insize, incoming, mlen);
2955     (void)host_nmtoa(insize, incoming, mlen, buffer, sep);
2956     key = buffer;
2957     filename = semicolon + 1;
2958     }
2959
2960   /* Now do the actual lookup; note that there is no search_close() because
2961   of the caching arrangements. */
2962
2963   if (!(handle = search_open(filename, search_type, 0, NULL, NULL)))
2964     log_write(0, LOG_MAIN|LOG_PANIC_DIE, "%s", search_error_message);
2965
2966   result = search_find(handle, filename, key, -1, NULL, 0, 0, NULL);
2967   if (valueptr != NULL) *valueptr = result;
2968   return (result != NULL)? OK : search_find_defer? DEFER: FAIL;
2969   }
2970
2971 /* The pattern is not an IP address or network reference of any kind. That is,
2972 it is a host name pattern. If this is an IP only match, there's an error in the
2973 host list. */
2974
2975 if (isiponly)
2976   {
2977   *error = US"cannot match host name in match_ip list";
2978   return ERROR;
2979   }
2980
2981 /* Check the characters of the pattern to see if they comprise only letters,
2982 digits, full stops, and hyphens (the constituents of domain names). Allow
2983 underscores, as they are all too commonly found. Sigh. Also, if
2984 allow_utf8_domains is set, allow top-bit characters. */
2985
2986 for (t = ss; *t != 0; t++)
2987   if (!isalnum(*t) && *t != '.' && *t != '-' && *t != '_' &&
2988       (!allow_utf8_domains || *t < 128)) break;
2989
2990 /* If the pattern is a complete domain name, with no fancy characters, look up
2991 its IP address and match against that. Note that a multi-homed host will add
2992 items to the chain. */
2993
2994 if (*t == 0)
2995   {
2996   int rc;
2997   host_item h;
2998   h.next = NULL;
2999   h.name = ss;
3000   h.address = NULL;
3001   h.mx = MX_NONE;
3002
3003   /* Using byname rather than bydns here means we cannot determine dnssec
3004   status.  On the other hand it is unclear how that could be either
3005   propagated up or enforced. */
3006
3007   rc = host_find_byname(&h, NULL, HOST_FIND_QUALIFY_SINGLE, NULL, FALSE);
3008   if (rc == HOST_FOUND || rc == HOST_FOUND_LOCAL)
3009     {
3010     host_item *hh;
3011     for (hh = &h; hh != NULL; hh = hh->next)
3012       {
3013       if (host_is_in_net(hh->address, cb->host_address, 0)) return OK;
3014       }
3015     return FAIL;
3016     }
3017   if (rc == HOST_FIND_AGAIN) return DEFER;
3018   *error = string_sprintf("failed to find IP address for %s", ss);
3019   return ERROR;
3020   }
3021
3022 /* Almost all subsequent comparisons require the host name, and can be done
3023 using the general string matching function. When this function is called for
3024 outgoing hosts, the name is always given explicitly. If it is NULL, it means we
3025 must use sender_host_name and its aliases, looking them up if necessary. */
3026
3027 if (cb->host_name != NULL)   /* Explicit host name given */
3028   return match_check_string(cb->host_name, ss, -1, TRUE, TRUE, TRUE,
3029     valueptr);
3030
3031 /* Host name not given; in principle we need the sender host name and its
3032 aliases. However, for query-style lookups, we do not need the name if the
3033 query does not contain $sender_host_name. From release 4.23, a reference to
3034 $sender_host_name causes it to be looked up, so we don't need to do the lookup
3035 on spec. */
3036
3037 if ((semicolon = Ustrchr(ss, ';')) != NULL)
3038   {
3039   const uschar *affix;
3040   int partial, affixlen, starflags, id;
3041
3042   *semicolon = 0;
3043   id = search_findtype_partial(ss, &partial, &affix, &affixlen, &starflags);
3044   *semicolon=';';
3045
3046   if (id < 0)                           /* Unknown lookup type */
3047     {
3048     log_write(0, LOG_MAIN|LOG_PANIC, "%s in host list item \"%s\"",
3049       search_error_message, ss);
3050     return DEFER;
3051     }
3052   isquery = mac_islookup(id, lookup_querystyle|lookup_absfilequery);
3053   }
3054
3055 if (isquery)
3056   {
3057   switch(match_check_string(US"", ss, -1, TRUE, TRUE, TRUE, valueptr))
3058     {
3059     case OK:    return OK;
3060     case DEFER: return DEFER;
3061     default:    return FAIL;
3062     }
3063   }
3064
3065 /* Not a query-style lookup; must ensure the host name is present, and then we
3066 do a check on the name and all its aliases. */
3067
3068 if (sender_host_name == NULL)
3069   {
3070   HDEBUG(D_host_lookup)
3071     debug_printf("sender host name required, to match against %s\n", ss);
3072   if (host_lookup_failed || host_name_lookup() != OK)
3073     {
3074     *error = string_sprintf("failed to find host name for %s",
3075       sender_host_address);;
3076     return ERROR;
3077     }
3078   host_build_sender_fullhost();
3079   }
3080
3081 /* Match on the sender host name, using the general matching function */
3082
3083 switch(match_check_string(sender_host_name, ss, -1, TRUE, TRUE, TRUE,
3084        valueptr))
3085   {
3086   case OK:    return OK;
3087   case DEFER: return DEFER;
3088   }
3089
3090 /* If there are aliases, try matching on them. */
3091
3092 aliases = sender_host_aliases;
3093 while (*aliases != NULL)
3094   {
3095   switch(match_check_string(*aliases++, ss, -1, TRUE, TRUE, TRUE, valueptr))
3096     {
3097     case OK:    return OK;
3098     case DEFER: return DEFER;
3099     }
3100   }
3101 return FAIL;
3102 }
3103
3104
3105
3106
3107 /*************************************************
3108 *    Check a specific host matches a host list   *
3109 *************************************************/
3110
3111 /* This function is passed a host list containing items in a number of
3112 different formats and the identity of a host. Its job is to determine whether
3113 the given host is in the set of hosts defined by the list. The host name is
3114 passed as a pointer so that it can be looked up if needed and not already
3115 known. This is commonly the case when called from verify_check_host() to check
3116 an incoming connection. When called from elsewhere the host name should usually
3117 be set.
3118
3119 This function is now just a front end to match_check_list(), which runs common
3120 code for scanning a list. We pass it the check_host() function to perform a
3121 single test.
3122
3123 Arguments:
3124   listptr              pointer to the host list
3125   cache_bits           pointer to cache for named lists, or NULL
3126   host_name            the host name or NULL, implying use sender_host_name and
3127                          sender_host_aliases, looking them up if required
3128   host_address         the IP address
3129   valueptr             if not NULL, data from a lookup is passed back here
3130
3131 Returns:    OK    if the host is in the defined set
3132             FAIL  if the host is not in the defined set,
3133             DEFER if a data lookup deferred (not a host lookup)
3134
3135 If the host name was needed in order to make a comparison, and could not be
3136 determined from the IP address, the result is FAIL unless the item
3137 "+allow_unknown" was met earlier in the list, in which case OK is returned. */
3138
3139 int
3140 verify_check_this_host(const uschar **listptr, unsigned int *cache_bits,
3141   const uschar *host_name, const uschar *host_address, const uschar **valueptr)
3142 {
3143 int rc;
3144 unsigned int *local_cache_bits = cache_bits;
3145 const uschar *save_host_address = deliver_host_address;
3146 check_host_block cb;
3147 cb.host_name = host_name;
3148 cb.host_address = host_address;
3149
3150 if (valueptr != NULL) *valueptr = NULL;
3151
3152 /* If the host address starts off ::ffff: it is an IPv6 address in
3153 IPv4-compatible mode. Find the IPv4 part for checking against IPv4
3154 addresses. */
3155
3156 cb.host_ipv4 = (Ustrncmp(host_address, "::ffff:", 7) == 0)?
3157   host_address + 7 : host_address;
3158
3159 /* During the running of the check, put the IP address into $host_address. In
3160 the case of calls from the smtp transport, it will already be there. However,
3161 in other calls (e.g. when testing ignore_target_hosts), it won't. Just to be on
3162 the safe side, any existing setting is preserved, though as I write this
3163 (November 2004) I can't see any cases where it is actually needed. */
3164
3165 deliver_host_address = host_address;
3166 rc = match_check_list(
3167        listptr,                                /* the list */
3168        0,                                      /* separator character */
3169        &hostlist_anchor,                       /* anchor pointer */
3170        &local_cache_bits,                      /* cache pointer */
3171        check_host,                             /* function for testing */
3172        &cb,                                    /* argument for function */
3173        MCL_HOST,                               /* type of check */
3174        (host_address == sender_host_address)?
3175          US"host" : host_address,              /* text for debugging */
3176        valueptr);                              /* where to pass back data */
3177 deliver_host_address = save_host_address;
3178 return rc;
3179 }
3180
3181
3182
3183
3184 /*************************************************
3185 *      Check the given host item matches a list  *
3186 *************************************************/
3187 int
3188 verify_check_given_host(uschar **listptr, host_item *host)
3189 {
3190 return verify_check_this_host(CUSS listptr, NULL, host->name, host->address, NULL);
3191 }
3192
3193 /*************************************************
3194 *      Check the remote host matches a list      *
3195 *************************************************/
3196
3197 /* This is a front end to verify_check_this_host(), created because checking
3198 the remote host is a common occurrence. With luck, a good compiler will spot
3199 the tail recursion and optimize it. If there's no host address, this is
3200 command-line SMTP input - check against an empty string for the address.
3201
3202 Arguments:
3203   listptr              pointer to the host list
3204
3205 Returns:               the yield of verify_check_this_host(),
3206                        i.e. OK, FAIL, or DEFER
3207 */
3208
3209 int
3210 verify_check_host(uschar **listptr)
3211 {
3212 return verify_check_this_host(CUSS listptr, sender_host_cache, NULL,
3213   (sender_host_address == NULL)? US"" : sender_host_address, NULL);
3214 }
3215
3216
3217
3218
3219
3220 /*************************************************
3221 *              Invert an IP address              *
3222 *************************************************/
3223
3224 /* Originally just used for DNS xBL lists, now also used for the
3225 reverse_ip expansion operator.
3226
3227 Arguments:
3228   buffer         where to put the answer
3229   address        the address to invert
3230 */
3231
3232 void
3233 invert_address(uschar *buffer, uschar *address)
3234 {
3235 int bin[4];
3236 uschar *bptr = buffer;
3237
3238 /* If this is an IPv4 address mapped into IPv6 format, adjust the pointer
3239 to the IPv4 part only. */
3240
3241 if (Ustrncmp(address, "::ffff:", 7) == 0) address += 7;
3242
3243 /* Handle IPv4 address: when HAVE_IPV6 is false, the result of host_aton() is
3244 always 1. */
3245
3246 if (host_aton(address, bin) == 1)
3247   {
3248   int i;
3249   int x = bin[0];
3250   for (i = 0; i < 4; i++)
3251     {
3252     sprintf(CS bptr, "%d.", x & 255);
3253     while (*bptr) bptr++;
3254     x >>= 8;
3255     }
3256   }
3257
3258 /* Handle IPv6 address. Actually, as far as I know, there are no IPv6 addresses
3259 in any DNS black lists, and the format in which they will be looked up is
3260 unknown. This is just a guess. */
3261
3262 #if HAVE_IPV6
3263 else
3264   {
3265   int i, j;
3266   for (j = 3; j >= 0; j--)
3267     {
3268     int x = bin[j];
3269     for (i = 0; i < 8; i++)
3270       {
3271       sprintf(CS bptr, "%x.", x & 15);
3272       while (*bptr) bptr++;
3273       x >>= 4;
3274       }
3275     }
3276   }
3277 #endif
3278
3279 /* Remove trailing period -- this is needed so that both arbitrary
3280 dnsbl keydomains and inverted addresses may be combined with the
3281 same format string, "%s.%s" */
3282
3283 *(--bptr) = 0;
3284 }
3285
3286
3287
3288 /*************************************************
3289 *          Perform a single dnsbl lookup         *
3290 *************************************************/
3291
3292 /* This function is called from verify_check_dnsbl() below. It is also called
3293 recursively from within itself when domain and domain_txt are different
3294 pointers, in order to get the TXT record from the alternate domain.
3295
3296 Arguments:
3297   domain         the outer dnsbl domain
3298   domain_txt     alternate domain to lookup TXT record on success; when the
3299                    same domain is to be used, domain_txt == domain (that is,
3300                    the pointers must be identical, not just the text)
3301   keydomain      the current keydomain (for debug message)
3302   prepend        subdomain to lookup (like keydomain, but
3303                    reversed if IP address)
3304   iplist         the list of matching IP addresses, or NULL for "any"
3305   bitmask        true if bitmask matching is wanted
3306   match_type     condition for 'succeed' result
3307                    0 => Any RR in iplist     (=)
3308                    1 => No RR in iplist      (!=)
3309                    2 => All RRs in iplist    (==)
3310                    3 => Some RRs not in iplist (!==)
3311                    the two bits are defined as MT_NOT and MT_ALL
3312   defer_return   what to return for a defer
3313
3314 Returns:         OK if lookup succeeded
3315                  FAIL if not
3316 */
3317
3318 static int
3319 one_check_dnsbl(uschar *domain, uschar *domain_txt, uschar *keydomain,
3320   uschar *prepend, uschar *iplist, BOOL bitmask, int match_type,
3321   int defer_return)
3322 {
3323 dns_answer dnsa;
3324 dns_scan dnss;
3325 tree_node *t;
3326 dnsbl_cache_block *cb;
3327 int old_pool = store_pool;
3328 uschar query[256];         /* DNS domain max length */
3329
3330 /* Construct the specific query domainname */
3331
3332 if (!string_format(query, sizeof(query), "%s.%s", prepend, domain))
3333   {
3334   log_write(0, LOG_MAIN|LOG_PANIC, "dnslist query is too long "
3335     "(ignored): %s...", query);
3336   return FAIL;
3337   }
3338
3339 /* Look for this query in the cache. */
3340
3341 if (  (t = tree_search(dnsbl_cache, query))
3342    && (cb = t->data.ptr)->expiry > time(NULL)
3343    )
3344
3345 /* Previous lookup was cached */
3346
3347   {
3348   HDEBUG(D_dnsbl) debug_printf("using result of previous DNS lookup\n");
3349   }
3350
3351 /* If not cached from a previous lookup, we must do a DNS lookup, and
3352 cache the result in permanent memory. */
3353
3354 else
3355   {
3356   uint ttl = 3600;
3357
3358   store_pool = POOL_PERM;
3359
3360   if (t)
3361     {
3362     HDEBUG(D_dnsbl) debug_printf("cached data found but past valid time; ");
3363     }
3364
3365   else
3366     {   /* Set up a tree entry to cache the lookup */
3367     t = store_get(sizeof(tree_node) + Ustrlen(query));
3368     Ustrcpy(t->name, query);
3369     t->data.ptr = cb = store_get(sizeof(dnsbl_cache_block));
3370     (void)tree_insertnode(&dnsbl_cache, t);
3371     }
3372
3373   /* Do the DNS lookup . */
3374
3375   HDEBUG(D_dnsbl) debug_printf("new DNS lookup for %s\n", query);
3376   cb->rc = dns_basic_lookup(&dnsa, query, T_A);
3377   cb->text_set = FALSE;
3378   cb->text = NULL;
3379   cb->rhs = NULL;
3380
3381   /* If the lookup succeeded, cache the RHS address. The code allows for
3382   more than one address - this was for complete generality and the possible
3383   use of A6 records. However, A6 records have been reduced to experimental
3384   status (August 2001) and may die out. So they may never get used at all,
3385   let alone in dnsbl records. However, leave the code here, just in case.
3386
3387   Quite apart from one A6 RR generating multiple addresses, there are DNS
3388   lists that return more than one A record, so we must handle multiple
3389   addresses generated in that way as well.
3390
3391   Mark the cache entry with the "now" plus the minimum of the address TTLs,
3392   or some suitably far-future time if none were found. */
3393
3394   if (cb->rc == DNS_SUCCEED)
3395     {
3396     dns_record *rr;
3397     dns_address **addrp = &(cb->rhs);
3398     for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
3399          rr;
3400          rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
3401       {
3402       if (rr->type == T_A)
3403         {
3404         dns_address *da = dns_address_from_rr(&dnsa, rr);
3405         if (da)
3406           {
3407           *addrp = da;
3408           while (da->next != NULL) da = da->next;
3409           addrp = &(da->next);
3410           if (ttl > rr->ttl) ttl = rr->ttl;
3411           }
3412         }
3413       }
3414
3415     /* If we didn't find any A records, change the return code. This can
3416     happen when there is a CNAME record but there are no A records for what
3417     it points to. */
3418
3419     if (cb->rhs == NULL) cb->rc = DNS_NODATA;
3420     }
3421
3422   cb->expiry = time(NULL)+ttl;
3423   store_pool = old_pool;
3424   }
3425
3426 /* We now have the result of the DNS lookup, either newly done, or cached
3427 from a previous call. If the lookup succeeded, check against the address
3428 list if there is one. This may be a positive equality list (introduced by
3429 "="), a negative equality list (introduced by "!="), a positive bitmask
3430 list (introduced by "&"), or a negative bitmask list (introduced by "!&").*/
3431
3432 if (cb->rc == DNS_SUCCEED)
3433   {
3434   dns_address *da = NULL;
3435   uschar *addlist = cb->rhs->address;
3436
3437   /* For A and AAAA records, there may be multiple addresses from multiple
3438   records. For A6 records (currently not expected to be used) there may be
3439   multiple addresses from a single record. */
3440
3441   for (da = cb->rhs->next; da != NULL; da = da->next)
3442     addlist = string_sprintf("%s, %s", addlist, da->address);
3443
3444   HDEBUG(D_dnsbl) debug_printf("DNS lookup for %s succeeded (yielding %s)\n",
3445     query, addlist);
3446
3447   /* Address list check; this can be either for equality, or via a bitmask.
3448   In the latter case, all the bits must match. */
3449
3450   if (iplist != NULL)
3451     {
3452     for (da = cb->rhs; da != NULL; da = da->next)
3453       {
3454       int ipsep = ',';
3455       uschar ip[46];
3456       const uschar *ptr = iplist;
3457       uschar *res;
3458
3459       /* Handle exact matching */
3460
3461       if (!bitmask)
3462         {
3463         while ((res = string_nextinlist(&ptr, &ipsep, ip, sizeof(ip))) != NULL)
3464           {
3465           if (Ustrcmp(CS da->address, ip) == 0) break;
3466           }
3467         }
3468
3469       /* Handle bitmask matching */
3470
3471       else
3472         {
3473         int address[4];
3474         int mask = 0;
3475
3476         /* At present, all known DNS blocking lists use A records, with
3477         IPv4 addresses on the RHS encoding the information they return. I
3478         wonder if this will linger on as the last vestige of IPv4 when IPv6
3479         is ubiquitous? Anyway, for now we use paranoia code to completely
3480         ignore IPv6 addresses. The default mask is 0, which always matches.
3481         We change this only for IPv4 addresses in the list. */
3482
3483         if (host_aton(da->address, address) == 1) mask = address[0];
3484
3485         /* Scan the returned addresses, skipping any that are IPv6 */
3486
3487         while ((res = string_nextinlist(&ptr, &ipsep, ip, sizeof(ip))) != NULL)
3488           {
3489           if (host_aton(ip, address) != 1) continue;
3490           if ((address[0] & mask) == address[0]) break;
3491           }
3492         }
3493
3494       /* If either
3495
3496          (a) An IP address in an any ('=') list matched, or
3497          (b) No IP address in an all ('==') list matched
3498
3499       then we're done searching. */
3500
3501       if (((match_type & MT_ALL) != 0) == (res == NULL)) break;
3502       }
3503
3504     /* If da == NULL, either
3505
3506        (a) No IP address in an any ('=') list matched, or
3507        (b) An IP address in an all ('==') list didn't match
3508
3509     so behave as if the DNSBL lookup had not succeeded, i.e. the host is not on
3510     the list. */
3511
3512     if ((match_type == MT_NOT || match_type == MT_ALL) != (da == NULL))
3513       {
3514       HDEBUG(D_dnsbl)
3515         {
3516         uschar *res = NULL;
3517         switch(match_type)
3518           {
3519           case 0:
3520           res = US"was no match";
3521           break;
3522           case MT_NOT:
3523           res = US"was an exclude match";
3524           break;
3525           case MT_ALL:
3526           res = US"was an IP address that did not match";
3527           break;
3528           case MT_NOT|MT_ALL:
3529           res = US"were no IP addresses that did not match";
3530           break;
3531           }
3532         debug_printf("=> but we are not accepting this block class because\n");
3533         debug_printf("=> there %s for %s%c%s\n",
3534           res,
3535           ((match_type & MT_ALL) == 0)? "" : "=",
3536           bitmask? '&' : '=', iplist);
3537         }
3538       return FAIL;
3539       }
3540     }
3541
3542   /* Either there was no IP list, or the record matched, implying that the
3543   domain is on the list. We now want to find a corresponding TXT record. If an
3544   alternate domain is specified for the TXT record, call this function
3545   recursively to look that up; this has the side effect of re-checking that
3546   there is indeed an A record at the alternate domain. */
3547
3548   if (domain_txt != domain)
3549     return one_check_dnsbl(domain_txt, domain_txt, keydomain, prepend, NULL,
3550       FALSE, match_type, defer_return);
3551
3552   /* If there is no alternate domain, look up a TXT record in the main domain
3553   if it has not previously been cached. */
3554
3555   if (!cb->text_set)
3556     {
3557     cb->text_set = TRUE;
3558     if (dns_basic_lookup(&dnsa, query, T_TXT) == DNS_SUCCEED)
3559       {
3560       dns_record *rr;
3561       for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
3562            rr != NULL;
3563            rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
3564         if (rr->type == T_TXT) break;
3565       if (rr != NULL)
3566         {
3567         int len = (rr->data)[0];
3568         if (len > 511) len = 127;
3569         store_pool = POOL_PERM;
3570         cb->text = string_sprintf("%.*s", len, (const uschar *)(rr->data+1));
3571         store_pool = old_pool;
3572         }
3573       }
3574     }
3575
3576   dnslist_value = addlist;
3577   dnslist_text = cb->text;
3578   return OK;
3579   }
3580
3581 /* There was a problem with the DNS lookup */
3582
3583 if (cb->rc != DNS_NOMATCH && cb->rc != DNS_NODATA)
3584   {
3585   log_write(L_dnslist_defer, LOG_MAIN,
3586     "DNS list lookup defer (probably timeout) for %s: %s", query,
3587     (defer_return == OK)?   US"assumed in list" :
3588     (defer_return == FAIL)? US"assumed not in list" :
3589                             US"returned DEFER");
3590   return defer_return;
3591   }
3592
3593 /* No entry was found in the DNS; continue for next domain */
3594
3595 HDEBUG(D_dnsbl)
3596   {
3597   debug_printf("DNS lookup for %s failed\n", query);
3598   debug_printf("=> that means %s is not listed at %s\n",
3599      keydomain, domain);
3600   }
3601
3602 return FAIL;
3603 }
3604
3605
3606
3607
3608 /*************************************************
3609 *        Check host against DNS black lists      *
3610 *************************************************/
3611
3612 /* This function runs checks against a list of DNS black lists, until one
3613 matches. Each item on the list can be of the form
3614
3615   domain=ip-address/key
3616
3617 The domain is the right-most domain that is used for the query, for example,
3618 blackholes.mail-abuse.org. If the IP address is present, there is a match only
3619 if the DNS lookup returns a matching IP address. Several addresses may be
3620 given, comma-separated, for example: x.y.z=127.0.0.1,127.0.0.2.
3621
3622 If no key is given, what is looked up in the domain is the inverted IP address
3623 of the current client host. If a key is given, it is used to construct the
3624 domain for the lookup. For example:
3625
3626   dsn.rfc-ignorant.org/$sender_address_domain
3627
3628 After finding a match in the DNS, the domain is placed in $dnslist_domain, and
3629 then we check for a TXT record for an error message, and if found, save its
3630 value in $dnslist_text. We also cache everything in a tree, to optimize
3631 multiple lookups.
3632
3633 The TXT record is normally looked up in the same domain as the A record, but
3634 when many lists are combined in a single DNS domain, this will not be a very
3635 specific message. It is possible to specify a different domain for looking up
3636 TXT records; this is given before the main domain, comma-separated. For
3637 example:
3638
3639   dnslists = http.dnsbl.sorbs.net,dnsbl.sorbs.net=127.0.0.2 : \
3640              socks.dnsbl.sorbs.net,dnsbl.sorbs.net=127.0.0.3
3641
3642 The caching ensures that only one lookup in dnsbl.sorbs.net is done.
3643
3644 Note: an address for testing RBL is 192.203.178.39
3645 Note: an address for testing DUL is 192.203.178.4
3646 Note: a domain for testing RFCI is example.tld.dsn.rfc-ignorant.org
3647
3648 Arguments:
3649   where        the acl type
3650   listptr      the domain/address/data list
3651   log_msgptr   log message on error
3652
3653 Returns:    OK      successful lookup (i.e. the address is on the list), or
3654                       lookup deferred after +include_unknown
3655             FAIL    name not found, or no data found for the given type, or
3656                       lookup deferred after +exclude_unknown (default)
3657             DEFER   lookup failure, if +defer_unknown was set
3658 */
3659
3660 int
3661 verify_check_dnsbl(int where, const uschar ** listptr, uschar ** log_msgptr)
3662 {
3663 int sep = 0;
3664 int defer_return = FAIL;
3665 const uschar *list = *listptr;
3666 uschar *domain;
3667 uschar *s;
3668 uschar buffer[1024];
3669 uschar revadd[128];        /* Long enough for IPv6 address */
3670
3671 /* Indicate that the inverted IP address is not yet set up */
3672
3673 revadd[0] = 0;
3674
3675 /* In case this is the first time the DNS resolver is being used. */
3676
3677 dns_init(FALSE, FALSE, FALSE);  /*XXX dnssec? */
3678
3679 /* Loop through all the domains supplied, until something matches */
3680
3681 while ((domain = string_nextinlist(&list, &sep, buffer, sizeof(buffer))) != NULL)
3682   {
3683   int rc;
3684   BOOL bitmask = FALSE;
3685   int match_type = 0;
3686   uschar *domain_txt;
3687   uschar *comma;
3688   uschar *iplist;
3689   uschar *key;
3690
3691   HDEBUG(D_dnsbl) debug_printf("DNS list check: %s\n", domain);
3692
3693   /* Deal with special values that change the behaviour on defer */
3694
3695   if (domain[0] == '+')
3696     {
3697     if      (strcmpic(domain, US"+include_unknown") == 0) defer_return = OK;
3698     else if (strcmpic(domain, US"+exclude_unknown") == 0) defer_return = FAIL;
3699     else if (strcmpic(domain, US"+defer_unknown") == 0)   defer_return = DEFER;
3700     else
3701       log_write(0, LOG_MAIN|LOG_PANIC, "unknown item in dnslist (ignored): %s",
3702         domain);
3703     continue;
3704     }
3705
3706   /* See if there's explicit data to be looked up */
3707
3708   if ((key = Ustrchr(domain, '/'))) *key++ = 0;
3709
3710   /* See if there's a list of addresses supplied after the domain name. This is
3711   introduced by an = or a & character; if preceded by = we require all matches
3712   and if preceded by ! we invert the result. */
3713
3714   if (!(iplist = Ustrchr(domain, '=')))
3715     {
3716     bitmask = TRUE;
3717     iplist = Ustrchr(domain, '&');
3718     }
3719
3720   if (iplist)                                  /* Found either = or & */
3721     {
3722     if (iplist > domain && iplist[-1] == '!')  /* Handle preceding ! */
3723       {
3724       match_type |= MT_NOT;
3725       iplist[-1] = 0;
3726       }
3727
3728     *iplist++ = 0;                             /* Terminate domain, move on */
3729
3730     /* If we found = (bitmask == FALSE), check for == or =& */
3731
3732     if (!bitmask && (*iplist == '=' || *iplist == '&'))
3733       {
3734       bitmask = *iplist++ == '&';
3735       match_type |= MT_ALL;
3736       }
3737     }
3738
3739
3740   /* If there is a comma in the domain, it indicates that a second domain for
3741   looking up TXT records is provided, before the main domain. Otherwise we must
3742   set domain_txt == domain. */
3743
3744   domain_txt = domain;
3745   comma = Ustrchr(domain, ',');
3746   if (comma != NULL)
3747     {
3748     *comma++ = 0;
3749     domain = comma;
3750     }
3751
3752   /* Check that what we have left is a sensible domain name. There is no reason
3753   why these domains should in fact use the same syntax as hosts and email
3754   domains, but in practice they seem to. However, there is little point in
3755   actually causing an error here, because that would no doubt hold up incoming
3756   mail. Instead, I'll just log it. */
3757
3758   for (s = domain; *s != 0; s++)
3759     {
3760     if (!isalnum(*s) && *s != '-' && *s != '.' && *s != '_')
3761       {
3762       log_write(0, LOG_MAIN, "dnslists domain \"%s\" contains "
3763         "strange characters - is this right?", domain);
3764       break;
3765       }
3766     }
3767
3768   /* Check the alternate domain if present */
3769
3770   if (domain_txt != domain) for (s = domain_txt; *s != 0; s++)
3771     {
3772     if (!isalnum(*s) && *s != '-' && *s != '.' && *s != '_')
3773       {
3774       log_write(0, LOG_MAIN, "dnslists domain \"%s\" contains "
3775         "strange characters - is this right?", domain_txt);
3776       break;
3777       }
3778     }
3779
3780   /* If there is no key string, construct the query by adding the domain name
3781   onto the inverted host address, and perform a single DNS lookup. */
3782
3783   if (key == NULL)
3784     {
3785     if (where == ACL_WHERE_NOTSMTP_START || where == ACL_WHERE_NOTSMTP)
3786       {
3787       *log_msgptr = string_sprintf
3788         ("cannot test auto-keyed dnslists condition in %s ACL",
3789           acl_wherenames[where]);
3790       return ERROR;
3791       }
3792     if (sender_host_address == NULL) return FAIL;    /* can never match */
3793     if (revadd[0] == 0) invert_address(revadd, sender_host_address);
3794     rc = one_check_dnsbl(domain, domain_txt, sender_host_address, revadd,
3795       iplist, bitmask, match_type, defer_return);
3796     if (rc == OK)
3797       {
3798       dnslist_domain = string_copy(domain_txt);
3799       dnslist_matched = string_copy(sender_host_address);
3800       HDEBUG(D_dnsbl) debug_printf("=> that means %s is listed at %s\n",
3801         sender_host_address, dnslist_domain);
3802       }
3803     if (rc != FAIL) return rc;     /* OK or DEFER */
3804     }
3805
3806   /* If there is a key string, it can be a list of domains or IP addresses to
3807   be concatenated with the main domain. */
3808
3809   else
3810     {
3811     int keysep = 0;
3812     BOOL defer = FALSE;
3813     uschar *keydomain;
3814     uschar keybuffer[256];
3815     uschar keyrevadd[128];
3816
3817     while ((keydomain = string_nextinlist(CUSS &key, &keysep, keybuffer,
3818             sizeof(keybuffer))) != NULL)
3819       {
3820       uschar *prepend = keydomain;
3821
3822       if (string_is_ip_address(keydomain, NULL) != 0)
3823         {
3824         invert_address(keyrevadd, keydomain);
3825         prepend = keyrevadd;
3826         }
3827
3828       rc = one_check_dnsbl(domain, domain_txt, keydomain, prepend, iplist,
3829         bitmask, match_type, defer_return);
3830
3831       if (rc == OK)
3832         {
3833         dnslist_domain = string_copy(domain_txt);
3834         dnslist_matched = string_copy(keydomain);
3835         HDEBUG(D_dnsbl) debug_printf("=> that means %s is listed at %s\n",
3836           keydomain, dnslist_domain);
3837         return OK;
3838         }
3839
3840       /* If the lookup deferred, remember this fact. We keep trying the rest
3841       of the list to see if we get a useful result, and if we don't, we return
3842       DEFER at the end. */
3843
3844       if (rc == DEFER) defer = TRUE;
3845       }    /* continue with next keystring domain/address */
3846
3847     if (defer) return DEFER;
3848     }
3849   }        /* continue with next dnsdb outer domain */
3850
3851 return FAIL;
3852 }
3853
3854 /* vi: aw ai sw=2
3855 */
3856 /* End of verify.c */