src/src/daemon.c

   1 /*************************************************
   2 *     Exim - an Internet mail transport agent    *
   3 *************************************************/
   4
   5 /* Copyright (c) The Exim Maintainers 2020 - 2024 */
   6 /* Copyright (c) University of Cambridge 1995 - 2018 */
   7 /* See the file NOTICE for conditions of use and distribution. */
   8 /* SPDX-License-Identifier: GPL-2.0-or-later */
   9
  10 /* Functions concerned with running Exim as a daemon */
  11
  12
  13 #include "exim.h"
  14
  15
  16 /* Structure for holding data for each SMTP connection */
  17
  18 typedef struct smtp_slot {
  19   pid_t         pid;            /* pid of the spawned reception process */
  20   uschar *      host_address;   /* address of the client host */
  21 } smtp_slot;
  22
  23 typedef struct runner_slot {
  24   pid_t         pid;            /* pid of spawned queue-runner process */
  25   const uschar *queue_name;     /* pointer to the name in the qrunner struct */
  26 } runner_slot;
  27
  28 /* An empty slot for initializing (Standard C does not allow constructor
  29 expressions in assignments except as initializers in declarations). */
  30
  31 static smtp_slot empty_smtp_slot = { .pid = 0, .host_address = NULL };
  32
  33 /*************************************************
  34 *               Local static variables           *
  35 *************************************************/
  36
  37 static SIGNAL_BOOL sigchld_seen;
  38 static SIGNAL_BOOL sighup_seen;
  39 static SIGNAL_BOOL sigterm_seen;
  40
  41 static int   accept_retry_count = 0;
  42 static int   accept_retry_errno;
  43 static BOOL  accept_retry_select_failed;
  44
  45 static int   queue_run_count = 0;       /* current runners */
  46
  47 static unsigned queue_runner_slot_count = 0;
  48 static runner_slot * queue_runner_slots = NULL;
  49 static smtp_slot * smtp_slots = NULL;
  50
  51 static BOOL  write_pid = TRUE;
  52
  53 #ifndef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
  54 static uschar * notifier_socket_name;
  55 #endif
  56
  57
  58 /*************************************************
  59 *             SIGHUP Handler                     *
  60 *************************************************/
  61
  62 /* All this handler does is to set a flag and re-enable the signal.
  63
  64 Argument: the signal number
  65 Returns:  nothing
  66 */
  67
  68 static void
  69 sighup_handler(int sig)
  70 {
  71 sighup_seen = TRUE;
  72 signal(SIGHUP, sighup_handler);
  73 }
  74
  75
  76
  77 /*************************************************
  78 *     SIGCHLD handler for main daemon process    *
  79 *************************************************/
  80
  81 /* Don't re-enable the handler here, since we aren't doing the
  82 waiting here. If the signal is re-enabled, there will just be an
  83 infinite sequence of calls to this handler. The SIGCHLD signal is
  84 used just as a means of waking up the daemon so that it notices
  85 terminated subprocesses as soon as possible.
  86
  87 Argument: the signal number
  88 Returns:  nothing
  89 */
  90
  91 static void
  92 main_sigchld_handler(int sig)
  93 {
  94 os_non_restarting_signal(SIGCHLD, SIG_DFL);
  95 sigchld_seen = TRUE;
  96 }
  97
  98
  99 /* SIGTERM handler.  Try to get the daemon pid file removed
 100 before exiting. */
 101
 102 static void
 103 main_sigterm_handler(int sig)
 104 {
 105 sigterm_seen = TRUE;
 106 }
 107
 108
 109
 110
 111 /*************************************************
 112 *          Unexpected errors in SMTP calls       *
 113 *************************************************/
 114
 115 /* This function just saves a bit of repetitious coding.
 116
 117 Arguments:
 118   log_msg        Text of message to be logged
 119   smtp_msg       Text of SMTP error message
 120   was_errno      The failing errno
 121
 122 Returns:         nothing
 123 */
 124
 125 static void
 126 never_error(uschar *log_msg, uschar *smtp_msg, int was_errno)
 127 {
 128 uschar *emsg = was_errno <= 0
 129   ? US"" : string_sprintf(": %s", strerror(was_errno));
 130 log_write(0, LOG_MAIN|LOG_PANIC, "%s%s", log_msg, emsg);
 131 if (smtp_out) smtp_printf("421 %s\r\n", SP_NO_MORE, smtp_msg);
 132 }
 133
 134
 135
 136
 137 /*************************************************
 138 *************************************************/
 139
 140 static void
 141 unlink_notifier_socket(void)
 142 {
 143 #ifndef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
 144 DEBUG(D_any) debug_printf("unlinking notifier socket %s\n", notifier_socket_name);
 145 Uunlink(notifier_socket_name);
 146 #endif
 147 }
 148
 149
 150 static void
 151 close_daemon_sockets(int daemon_notifier_fd,
 152   struct pollfd * fd_polls, int listen_socket_count)
 153 {
 154 if (daemon_notifier_fd >= 0)
 155   {
 156   (void) close(daemon_notifier_fd);
 157   daemon_notifier_fd = -1;
 158   }
 159
 160 for (int i = 0; i < listen_socket_count; i++) (void) close(fd_polls[i].fd);
 161 }
 162
 163
 164 /*************************************************
 165 *            Handle a connected SMTP call        *
 166 *************************************************/
 167
 168 /* This function is called when an SMTP connection has been accepted.
 169 If there are too many, give an error message and close down. Otherwise
 170 spin off a sub-process to handle the call. The list of listening sockets
 171 is required so that they can be closed in the sub-process. Take care not to
 172 leak store in this process - reset the stacking pool at the end.
 173
 174 Arguments:
 175   fd_polls        sockets which are listening for incoming calls
 176   listen_socket_count   count of listening sockets
 177   accept_socket         socket of the current accepted call
 178   accepted              socket information about the current call
 179
 180 Returns:            nothing
 181 */
 182
 183 static void
 184 handle_smtp_call(struct pollfd * fd_polls, int listen_socket_count,
 185   int accept_socket, struct sockaddr *accepted)
 186 {
 187 pid_t pid;
 188 union sockaddr_46 interface_sockaddr;
 189 EXIM_SOCKLEN_T ifsize = sizeof(interface_sockaddr);
 190 int dup_accept_socket = -1;
 191 int max_for_this_host = 0;
 192 int save_log_selector = *log_selector;
 193 gstring * whofrom;
 194
 195 rmark reset_point = store_mark();
 196
 197 /* Make the address available in ASCII representation, and also fish out
 198 the remote port. */
 199
 200 sender_host_address = host_ntoa(-1, accepted, NULL, &sender_host_port);
 201 DEBUG(D_any) debug_printf("Connection request from %s port %d\n",
 202   sender_host_address, sender_host_port);
 203
 204 /* Set up the output stream, check the socket has duplicated, and set up the
 205 input stream. These operations fail only the exceptional circumstances. Note
 206 that never_error() won't use smtp_out if it is NULL. */
 207
 208 if (!(smtp_out = fdopen(accept_socket, "wb")))
 209   {
 210   never_error(US"daemon: fdopen() for smtp_out failed", US"", errno);
 211   goto ERROR_RETURN;
 212   }
 213
 214 if ((dup_accept_socket = dup(accept_socket)) < 0)
 215   {
 216   never_error(US"daemon: couldn't dup socket descriptor",
 217     US"Connection setup failed", errno);
 218   goto ERROR_RETURN;
 219   }
 220
 221 if (!(smtp_in = fdopen(dup_accept_socket, "rb")))
 222   {
 223   never_error(US"daemon: fdopen() for smtp_in failed",
 224     US"Connection setup failed", errno);
 225   goto ERROR_RETURN;
 226   }
 227
 228 /* Get the data for the local interface address. Panic for most errors, but
 229 "connection reset by peer" just means the connection went away. */
 230
 231 if (getsockname(accept_socket, (struct sockaddr *)(&interface_sockaddr),
 232      &ifsize) < 0)
 233   {
 234   log_write(0, LOG_MAIN | ((errno == ECONNRESET)? 0 : LOG_PANIC),
 235     "getsockname() failed: %s", strerror(errno));
 236   smtp_printf("421 Local problem: getsockname() failed; please try again later\r\n", SP_NO_MORE);
 237   goto ERROR_RETURN;
 238   }
 239
 240 interface_address = host_ntoa(-1, &interface_sockaddr, NULL, &interface_port);
 241 DEBUG(D_interface) debug_printf("interface address=%s port=%d\n",
 242   interface_address, interface_port);
 243
 244 /* Build a string identifying the remote host and, if requested, the port and
 245 the local interface data. This is for logging; at the end of this function the
 246 memory is reclaimed. */
 247
 248 whofrom = string_append(NULL, 3, "[", sender_host_address, "]");
 249
 250 if (LOGGING(incoming_port))
 251   whofrom = string_fmt_append(whofrom, ":%d", sender_host_port);
 252
 253 if (LOGGING(incoming_interface))
 254   whofrom = string_fmt_append(whofrom, " I=[%s]:%d",
 255     interface_address, interface_port);
 256
 257 /* Check maximum number of connections. We do not check for reserved
 258 connections or unacceptable hosts here. That is done in the subprocess because
 259 it might take some time. */
 260
 261 if (smtp_accept_max > 0 && smtp_accept_count >= smtp_accept_max)
 262   {
 263   DEBUG(D_any) debug_printf("rejecting SMTP connection: count=%d max=%d\n",
 264     smtp_accept_count, smtp_accept_max);
 265   smtp_printf("421 Too many concurrent SMTP connections; "
 266     "please try again later.\r\n", SP_NO_MORE);
 267   log_write(L_connection_reject,
 268             LOG_MAIN, "Connection from %Y refused: too many connections",
 269     whofrom);
 270   goto ERROR_RETURN;
 271   }
 272
 273 /* If a load limit above which only reserved hosts are acceptable is defined,
 274 get the load average here, and if there are in fact no reserved hosts, do
 275 the test right away (saves a fork). If there are hosts, do the check in the
 276 subprocess because it might take time. */
 277
 278 if (smtp_load_reserve >= 0)
 279   {
 280   load_average = OS_GETLOADAVG();
 281   if (!smtp_reserve_hosts && load_average > smtp_load_reserve)
 282     {
 283     DEBUG(D_any) debug_printf("rejecting SMTP connection: load average = %.2f\n",
 284       (double)load_average/1000.0);
 285     smtp_printf("421 Too much load; please try again later.\r\n", SP_NO_MORE);
 286     log_write(L_connection_reject,
 287               LOG_MAIN, "Connection from %Y refused: load average = %.2f",
 288       whofrom, (double)load_average/1000.0);
 289     goto ERROR_RETURN;
 290     }
 291   }
 292
 293 /* Check that one specific host (strictly, IP address) is not hogging
 294 resources. This is done here to prevent a denial of service attack by someone
 295 forcing you to fork lots of times before denying service. The value of
 296 smtp_accept_max_per_host is a string which is expanded. This makes it possible
 297 to provide host-specific limits according to $sender_host address, but because
 298 this is in the daemon mainline, only fast expansions (such as inline address
 299 checks) should be used. The documentation is full of warnings. */
 300
 301 GET_OPTION("smtp_accept_max_per_host");
 302 if (smtp_accept_max_per_host)
 303   {
 304   uschar * expanded = expand_string(smtp_accept_max_per_host);
 305   if (!expanded)
 306     {
 307     if (!f.expand_string_forcedfail)
 308       log_write(0, LOG_MAIN|LOG_PANIC, "expansion of smtp_accept_max_per_host "
 309         "failed for %Y: %s", whofrom, expand_string_message);
 310     }
 311   /* For speed, interpret a decimal number inline here */
 312   else
 313     {
 314     uschar * s = expanded;
 315     while (isdigit(*s))
 316       max_for_this_host = max_for_this_host * 10 + *s++ - '0';
 317     if (*s)
 318       log_write(0, LOG_MAIN|LOG_PANIC, "expansion of smtp_accept_max_per_host "
 319         "for %Y contains non-digit: %s", whofrom, expanded);
 320     }
 321   }
 322
 323 /* If we have fewer total connections than max_for_this_host, we can skip the
 324 tedious per host_address checks. Note that at this stage smtp_accept_count
 325 contains the count of *other* connections, not including this one. */
 326
 327 if (  smtp_slots
 328    && max_for_this_host > 0 && smtp_accept_count >= max_for_this_host)
 329   {
 330   int host_accept_count = 0;
 331   int other_host_count = 0;    /* keep a count of non matches to optimise */
 332
 333   for (int i = 0; i < smtp_accept_max; ++i)
 334     if (smtp_slots[i].host_address)
 335       {
 336       if (Ustrcmp(sender_host_address, smtp_slots[i].host_address) == 0)
 337        host_accept_count++;
 338       else
 339        other_host_count++;
 340
 341       /* Testing all these strings is expensive - see if we can drop out
 342       early, either by hitting the target, or finding there are not enough
 343       connections left to make the target. */
 344
 345       if (  host_accept_count >= max_for_this_host
 346          || smtp_accept_count - other_host_count < max_for_this_host)
 347        break;
 348       }
 349
 350   if (host_accept_count >= max_for_this_host)
 351     {
 352     DEBUG(D_any) debug_printf("rejecting SMTP connection: too many from this "
 353       "IP address: count=%d max=%d\n",
 354       host_accept_count, max_for_this_host);
 355     smtp_printf("421 Too many concurrent SMTP connections "
 356       "from this IP address; please try again later.\r\n", SP_NO_MORE);
 357     log_write(L_connection_reject,
 358               LOG_MAIN, "Connection from %Y refused: too many connections "
 359       "from that IP address", whofrom);
 360     search_tidyup();
 361     goto ERROR_RETURN;
 362     }
 363   }
 364
 365 /* OK, the connection count checks have been passed.
 366 Now we can fork the accepting process; do a lookup tidy, just in case any
 367 expansion above did a lookup. */
 368
 369 search_tidyup();
 370 pid = exim_fork(US"daemon-accept");
 371
 372 /* Handle the child process */
 373
 374 if (pid == 0)
 375   {
 376   int queue_only_reason = 0;
 377   int old_pool = store_pool;
 378   int save_debug_selector = debug_selector;
 379   BOOL local_queue_only;
 380   BOOL session_local_queue_only;
 381 #ifdef SA_NOCLDWAIT
 382   struct sigaction act;
 383 #endif
 384
 385   smtp_accept_count++;    /* So that it includes this process */
 386   set_connection_id();
 387
 388   /* Log the connection if requested.
 389   In order to minimize the cost (because this is going to happen for every
 390   connection), do a preliminary selector test here. This saves ploughing through
 391   the generalized logging code each time when the selector is false. If the
 392   selector is set, check whether the host is on the list for logging. If not,
 393   arrange to unset the selector in the subprocess.
 394
 395   jgh 2023/08/08 :- moved this logging in from the parent process, just
 396   pre-fork.  There was a claim back from 4.21 (when it was moved from
 397   smtp_start_session()) that smtp_accept_count could have become out-of-date by
 398   the time the child could log it, and I can't see how that could happen. */
 399
 400   if (LOGGING(smtp_connection))
 401     {
 402     uschar * list = hosts_connection_nolog;
 403     memset(sender_host_cache, 0, sizeof(sender_host_cache));
 404     if (list && verify_check_host(&list) == OK)
 405       save_log_selector &= ~L_smtp_connection;
 406     else if (LOGGING(connection_id))
 407       log_write(L_smtp_connection, LOG_MAIN, "SMTP connection from %Y "
 408         "Ci=%s (TCP/IP connection count = %d)",
 409         whofrom, connection_id, smtp_accept_count);
 410     else
 411       log_write(L_smtp_connection, LOG_MAIN, "SMTP connection from %Y "
 412         "(TCP/IP connection count = %d)", whofrom, smtp_accept_count);
 413     }
 414
 415   /* If the listen backlog was over the monitoring level, log it. */
 416
 417   if (smtp_listen_backlog > smtp_backlog_monitor)
 418     log_write(0, LOG_MAIN, "listen backlog %d I=[%s]:%d",
 419                 smtp_listen_backlog, interface_address, interface_port);
 420
 421   /* May have been modified for the subprocess */
 422
 423   *log_selector = save_log_selector;
 424
 425   /* Get the local interface address into permanent store */
 426
 427   store_pool = POOL_PERM;
 428   interface_address = string_copy(interface_address);
 429   store_pool = old_pool;
 430
 431   /* Check for a tls-on-connect port */
 432
 433   if (host_is_tls_on_connect_port(interface_port)) tls_in.on_connect = TRUE;
 434
 435   /* Expand smtp_active_hostname if required. We do not do this any earlier,
 436   because it may depend on the local interface address (indeed, that is most
 437   likely what it depends on.) */
 438
 439   smtp_active_hostname = primary_hostname;
 440   GET_OPTION("smtp_active_hostname");
 441   if (raw_active_hostname)
 442     {
 443     uschar * nah = expand_string(raw_active_hostname);
 444     if (!nah)
 445       {
 446       if (!f.expand_string_forcedfail)
 447         {
 448         log_write(0, LOG_MAIN|LOG_PANIC, "failed to expand \"%s\" "
 449           "(smtp_active_hostname): %s", raw_active_hostname,
 450           expand_string_message);
 451         smtp_printf("421 Local configuration error; "
 452           "please try again later.\r\n", SP_NO_MORE);
 453         mac_smtp_fflush();
 454         search_tidyup();
 455         exim_underbar_exit(EXIT_FAILURE);
 456         }
 457       }
 458     else if (*nah) smtp_active_hostname = nah;
 459     }
 460
 461   /* Initialize the queueing flags */
 462
 463   queue_check_only();
 464   session_local_queue_only = queue_only;
 465
 466   /* Close the listening sockets, and set the SIGCHLD handler to SIG_IGN.
 467   We also attempt to set things up so that children are automatically reaped,
 468   but just in case this isn't available, there's a paranoid waitpid() in the
 469   loop too (except for systems where we are sure it isn't needed). See the more
 470   extensive comment before the reception loop in exim.c for a fuller
 471   explanation of this logic. */
 472
 473   close_daemon_sockets(daemon_notifier_fd, fd_polls, listen_socket_count);
 474
 475   /* Set FD_CLOEXEC on the SMTP socket. We don't want any rogue child processes
 476   to be able to communicate with them, under any circumstances. */
 477   (void)fcntl(accept_socket, F_SETFD,
 478               fcntl(accept_socket, F_GETFD) | FD_CLOEXEC);
 479   (void)fcntl(dup_accept_socket, F_SETFD,
 480               fcntl(dup_accept_socket, F_GETFD) | FD_CLOEXEC);
 481
 482 #ifdef SA_NOCLDWAIT
 483   act.sa_handler = SIG_IGN;
 484   sigemptyset(&(act.sa_mask));
 485   act.sa_flags = SA_NOCLDWAIT;
 486   sigaction(SIGCHLD, &act, NULL);
 487 #else
 488   signal(SIGCHLD, SIG_IGN);
 489 #endif
 490   signal(SIGTERM, SIG_DFL);
 491   signal(SIGINT, SIG_DFL);
 492
 493   /* Attempt to get an id from the sending machine via the RFC 1413
 494   protocol. We do this in the sub-process in order not to hold up the
 495   main process if there is any delay. Then set up the fullhost information
 496   in case there is no HELO/EHLO.
 497
 498   If debugging is enabled only for the daemon, we must turn if off while
 499   finding the id, but turn it on again afterwards so that information about the
 500   incoming connection is output. */
 501
 502   if (f.debug_daemon) debug_selector = 0;
 503   verify_get_ident(IDENT_PORT);
 504   host_build_sender_fullhost();
 505   debug_selector = save_debug_selector;
 506
 507   DEBUG(D_any)
 508     debug_printf("Process %d is handling incoming connection from %s\n",
 509       (int)getpid(), sender_fullhost);
 510
 511   /* Now disable debugging permanently if it's required only for the daemon
 512   process. */
 513
 514   if (f.debug_daemon) debug_selector = 0;
 515
 516   /* If there are too many child processes for immediate delivery,
 517   set the session_local_queue_only flag, which is initialized from the
 518   configured value and may therefore already be TRUE. Leave logging
 519   till later so it will have a message id attached. Note that there is no
 520   possibility of re-calculating this per-message, because the value of
 521   smtp_accept_count does not change in this subprocess. */
 522
 523   if (smtp_accept_queue > 0 && smtp_accept_count > smtp_accept_queue)
 524     {
 525     session_local_queue_only = TRUE;
 526     queue_only_reason = 1;
 527     }
 528
 529   /* Handle the start of the SMTP session, then loop, accepting incoming
 530   messages from the SMTP connection. The end will come at the QUIT command,
 531   when smtp_setup_msg() returns 0. A break in the connection causes the
 532   process to die (see accept.c).
 533
 534   NOTE: We do *not* call smtp_log_no_mail() if smtp_start_session() fails,
 535   because a log line has already been written for all its failure exists
 536   (usually "connection refused: <reason>") and writing another one is
 537   unnecessary clutter. */
 538
 539   if (!smtp_start_session())
 540     {
 541     mac_smtp_fflush();
 542     search_tidyup();
 543     exim_underbar_exit(EXIT_SUCCESS);
 544     }
 545
 546   for (;;)
 547     {
 548     int rc;
 549     message_id[0] = 0;            /* Clear out any previous message_id */
 550     reset_point = store_mark();   /* Save current store high water point */
 551
 552     DEBUG(D_any)
 553       debug_printf("Process %d is ready for new message\n", (int)getpid());
 554
 555     /* Smtp_setup_msg() returns 0 on QUIT or if the call is from an
 556     unacceptable host or if an ACL "drop" command was triggered, -1 on
 557     connection lost, and +1 on validly reaching DATA. Receive_msg() almost
 558     always returns TRUE when smtp_input is true; just retry if no message was
 559     accepted (can happen for invalid message parameters). However, it can yield
 560     FALSE if the connection was forcibly dropped by the DATA ACL. */
 561
 562     if ((rc = smtp_setup_msg()) > 0)
 563       {
 564       BOOL ok = receive_msg(FALSE);
 565       search_tidyup();                    /* Close cached databases */
 566       if (!ok)                            /* Connection was dropped */
 567         {
 568         cancel_cutthrough_connection(TRUE, US"receive dropped");
 569         mac_smtp_fflush();
 570         smtp_log_no_mail();               /* Log no mail if configured */
 571         exim_underbar_exit(EXIT_SUCCESS);
 572         }
 573       if (!message_id[0]) continue;     /* No message was accepted */
 574       }
 575     else                                /* bad smtp_setup_msg() */
 576       {
 577       if (smtp_out)
 578         {
 579         int fd = fileno(smtp_in);
 580         uschar buf[128];
 581
 582         mac_smtp_fflush();
 583         /* drain socket, for clean TCP FINs */
 584         if (fcntl(fd, F_SETFL, O_NONBLOCK) == 0)
 585           for(int i = 16; read(fd, buf, sizeof(buf)) > 0 && i > 0; ) i--;
 586         }
 587       cancel_cutthrough_connection(TRUE, US"message setup dropped");
 588       search_tidyup();
 589       smtp_log_no_mail();                 /* Log no mail if configured */
 590
 591       /*XXX should we pause briefly, hoping that the client will be the
 592       active TCP closer hence get the TCP_WAIT endpoint? */
 593       DEBUG(D_receive) debug_printf("SMTP>>(close on process exit)\n");
 594       exim_underbar_exit(rc ? EXIT_FAILURE : EXIT_SUCCESS);
 595       }
 596
 597     /* Show the recipients when debugging */
 598
 599     DEBUG(D_receive)
 600       {
 601       if (sender_address)
 602         debug_printf("Sender: %s\n", sender_address);
 603       if (recipients_list)
 604         {
 605         debug_printf("Recipients:\n");
 606         for (int i = 0; i < recipients_count; i++)
 607           debug_printf("  %s\n", recipients_list[i].address);
 608         }
 609       }
 610
 611     /* A message has been accepted. Clean up any previous delivery processes
 612     that have completed and are defunct, on systems where they don't go away
 613     by themselves (see comments when setting SIG_IGN above). On such systems
 614     (if any) these delivery processes hang around after termination until
 615     the next message is received. */
 616
 617     #ifndef SIG_IGN_WORKS
 618     while (waitpid(-1, NULL, WNOHANG) > 0);
 619     #endif
 620
 621     /* Reclaim up the store used in accepting this message */
 622
 623       {
 624       int r = receive_messagecount;
 625       BOOL q = f.queue_only_policy;
 626       smtp_reset(reset_point);
 627       reset_point = NULL;
 628       f.queue_only_policy = q;
 629       receive_messagecount = r;
 630       }
 631
 632     /* If queue_only is set or if there are too many incoming connections in
 633     existence, session_local_queue_only will be TRUE. If it is not, check
 634     whether we have received too many messages in this session for immediate
 635     delivery. */
 636
 637     if (!session_local_queue_only &&
 638         smtp_accept_queue_per_connection > 0 &&
 639         receive_messagecount > smtp_accept_queue_per_connection)
 640       {
 641       session_local_queue_only = TRUE;
 642       queue_only_reason = 2;
 643       }
 644
 645     /* Initialize local_queue_only from session_local_queue_only. If it is not
 646     true, and queue_only_load is set, check that the load average is below it.
 647     If local_queue_only is set by this means, we also set if for the session if
 648     queue_only_load_latch is true (the default). This means that, once set,
 649     local_queue_only remains set for any subsequent messages on the same SMTP
 650     connection. This is a deliberate choice; even though the load average may
 651     fall, it doesn't seem right to deliver later messages on the same call when
 652     not delivering earlier ones. However, the are special circumstances such as
 653     very long-lived connections from scanning appliances where this is not the
 654     best strategy. In such cases, queue_only_load_latch should be set false. */
 655
 656     if (  !(local_queue_only = session_local_queue_only)
 657        && queue_only_load >= 0
 658        && (local_queue_only = (load_average = OS_GETLOADAVG()) > queue_only_load)
 659        )
 660       {
 661       queue_only_reason = 3;
 662       if (queue_only_load_latch) session_local_queue_only = TRUE;
 663       }
 664
 665     /* Log the queueing here, when it will get a message id attached, but
 666     not if queue_only is set (case 0). */
 667
 668     if (local_queue_only) switch(queue_only_reason)
 669       {
 670       case 1: log_write(L_delay_delivery,
 671                 LOG_MAIN, "no immediate delivery: too many connections "
 672                 "(%d, max %d)", smtp_accept_count, smtp_accept_queue);
 673               break;
 674
 675       case 2: log_write(L_delay_delivery,
 676                 LOG_MAIN, "no immediate delivery: more than %d messages "
 677                 "received in one connection", smtp_accept_queue_per_connection);
 678               break;
 679
 680       case 3: log_write(L_delay_delivery,
 681                 LOG_MAIN, "no immediate delivery: load average %.2f",
 682                 (double)load_average/1000.0);
 683               break;
 684       }
 685
 686     /* If a delivery attempt is required, spin off a new process to handle it.
 687     If we are not root, we have to re-exec exim unless deliveries are being
 688     done unprivileged. */
 689
 690     else if (  (!f.queue_only_policy || f.queue_smtp)
 691             && !f.deliver_freeze)
 692       {
 693       pid_t dpid;
 694
 695       /* We used to flush smtp_out before forking so that buffered data was not
 696       duplicated, but now we want to pipeline the responses for data and quit.
 697       Instead, hard-close the fd underlying smtp_out right after fork to discard
 698       the data buffer. */
 699
 700       if ((dpid = exim_fork(US"daemon-accept-delivery")) == 0)
 701         {
 702         (void)fclose(smtp_in);
 703         (void)close(fileno(smtp_out));
 704         (void)fclose(smtp_out);
 705         smtp_in = smtp_out = NULL;
 706
 707         /* Don't ever molest the parent's SSL connection, but do clean up
 708         the data structures if necessary. */
 709
 710 #ifndef DISABLE_TLS
 711         tls_close(NULL, TLS_NO_SHUTDOWN);
 712 #endif
 713
 714         /* Reset SIGHUP and SIGCHLD in the child in both cases. */
 715
 716         signal(SIGHUP,  SIG_DFL);
 717         signal(SIGCHLD, SIG_DFL);
 718         signal(SIGTERM, SIG_DFL);
 719         signal(SIGINT, SIG_DFL);
 720
 721         if (geteuid() != root_uid && !deliver_drop_privilege)
 722           {
 723           signal(SIGALRM, SIG_DFL);
 724           delivery_re_exec(CEE_EXEC_PANIC);
 725           /* Control does not return here. */
 726           }
 727
 728         /* No need to re-exec; SIGALRM remains set to the default handler */
 729
 730         (void) deliver_message(message_id, FALSE, FALSE);
 731         search_tidyup();
 732         exim_underbar_exit(EXIT_SUCCESS);
 733         }
 734
 735       if (dpid > 0)
 736         {
 737         release_cutthrough_connection(US"passed for delivery");
 738         DEBUG(D_any) debug_printf("forked delivery process %d\n", (int)dpid);
 739         }
 740       else
 741         {
 742         cancel_cutthrough_connection(TRUE, US"delivery fork failed");
 743         log_write(0, LOG_MAIN|LOG_PANIC, "daemon: delivery process fork "
 744           "failed: %s", strerror(errno));
 745         }
 746       }
 747     }
 748   }
 749
 750
 751 /* Carrying on in the parent daemon process... Can't do much if the fork
 752 failed. Otherwise, keep count of the number of accepting processes and
 753 remember the pid for ticking off when the child completes. */
 754
 755 if (pid < 0)
 756   never_error(US"daemon: accept process fork failed", US"Fork failed", errno);
 757 else if (smtp_slots)
 758   {
 759   for (int i = 0; i < smtp_accept_max; ++i)
 760     if (smtp_slots[i].pid <= 0)
 761       {
 762       smtp_slots[i].pid = pid;
 763       /* Connection closes come asyncronously, so we cannot stack this store */
 764       if (smtp_accept_max_per_host)
 765         smtp_slots[i].host_address = string_copy_malloc(sender_host_address);
 766       smtp_accept_count++;
 767       break;
 768       }
 769   DEBUG(D_any) debug_printf("%d SMTP accept process%s running\n",
 770     smtp_accept_count, smtp_accept_count == 1 ? "" : "es");
 771   }
 772
 773 /* Get here via goto in error cases */
 774
 775 ERROR_RETURN:
 776
 777 /* Close the streams associated with the socket which will also close the
 778 socket fds in this process. We can't do anything if fclose() fails, but
 779 logging brings it to someone's attention. However, "connection reset by peer"
 780 isn't really a problem, so skip that one. On Solaris, a dropped connection can
 781 manifest itself as a broken pipe, so drop that one too. If the streams don't
 782 exist, something went wrong while setting things up. Make sure the socket
 783 descriptors are closed, in order to drop the connection. */
 784
 785 if (smtp_out)
 786   {
 787   if (fclose(smtp_out) != 0 && errno != ECONNRESET && errno != EPIPE)
 788     log_write(0, LOG_MAIN|LOG_PANIC, "daemon: fclose(smtp_out) failed: %s",
 789       strerror(errno));
 790   smtp_out = NULL;
 791   }
 792 else (void)close(accept_socket);
 793
 794 if (smtp_in)
 795   {
 796   if (fclose(smtp_in) != 0 && errno != ECONNRESET && errno != EPIPE)
 797     log_write(0, LOG_MAIN|LOG_PANIC, "daemon: fclose(smtp_in) failed: %s",
 798       strerror(errno));
 799   smtp_in = NULL;
 800   }
 801 else (void)close(dup_accept_socket);
 802
 803 /* Release any store used in this process, including the store used for holding
 804 the incoming host address and an expanded active_hostname. */
 805
 806 log_close_all();
 807 interface_address = sender_host_name = sender_host_address = NULL;
 808 store_reset(reset_point);
 809 }
 810
 811
 812
 813
 814 /*************************************************
 815 *       Check wildcard listen special cases      *
 816 *************************************************/
 817
 818 /* This function is used when binding and listening on lists of addresses and
 819 ports. It tests for special cases of wildcard listening, when IPv4 and IPv6
 820 sockets may interact in different ways in different operating systems. It is
 821 passed an error number, the list of listening addresses, and the current
 822 address. Two checks are available: for a previous wildcard IPv6 address, or for
 823 a following wildcard IPv4 address, in both cases on the same port.
 824
 825 In practice, pairs of wildcard addresses should be adjacent in the address list
 826 because they are sorted that way below.
 827
 828 Arguments:
 829   eno            the error number
 830   addresses      the list of addresses
 831   ipa            the current IP address
 832   back           if TRUE, check for previous wildcard IPv6 address
 833                  if FALSE, check for a following wildcard IPv4 address
 834
 835 Returns:         TRUE or FALSE
 836 */
 837
 838 static BOOL
 839 check_special_case(int eno, ip_address_item *addresses, ip_address_item *ipa,
 840   BOOL back)
 841 {
 842 ip_address_item *ipa2;
 843
 844 /* For the "back" case, if the failure was "address in use" for a wildcard IPv4
 845 address, seek a previous IPv6 wildcard address on the same port. As it is
 846 previous, it must have been successfully bound and be listening. Flag it as a
 847 "6 including 4" listener. */
 848
 849 if (back)
 850   {
 851   if (eno != EADDRINUSE || ipa->address[0] != 0) return FALSE;
 852   for (ipa2 = addresses; ipa2 != ipa; ipa2 = ipa2->next)
 853     {
 854     if (ipa2->address[1] == 0 && ipa2->port == ipa->port)
 855       {
 856       ipa2->v6_include_v4 = TRUE;
 857       return TRUE;
 858       }
 859     }
 860   }
 861
 862 /* For the "forward" case, if the current address is a wildcard IPv6 address,
 863 we seek a following wildcard IPv4 address on the same port. */
 864
 865 else
 866   {
 867   if (ipa->address[0] != ':' || ipa->address[1] != 0) return FALSE;
 868   for (ipa2 = ipa->next; ipa2 != NULL; ipa2 = ipa2->next)
 869     if (ipa2->address[0] == 0 && ipa->port == ipa2->port) return TRUE;
 870   }
 871
 872 return FALSE;
 873 }
 874
 875
 876
 877
 878 /*************************************************
 879 *         Handle terminating subprocesses        *
 880 *************************************************/
 881
 882 /* Handle the termination of child processes. Theoretically, this need be done
 883 only when sigchld_seen is TRUE, but rumour has it that some systems lose
 884 SIGCHLD signals at busy times, so to be on the safe side, this function is
 885 called each time round. It shouldn't be too expensive.
 886
 887 Arguments:  none
 888 Returns:    nothing
 889 */
 890
 891 static void
 892 handle_ending_processes(void)
 893 {
 894 int status;
 895 pid_t pid;
 896
 897 while ((pid = waitpid(-1, &status, WNOHANG)) > 0)
 898   {
 899   DEBUG(D_any)
 900     {
 901     debug_printf("child %ld ended: status=0x%x\n", (long)pid, status);
 902 #ifdef WCOREDUMP
 903     if (WIFEXITED(status))
 904       debug_printf("  normal exit, %d\n", WEXITSTATUS(status));
 905     else if (WIFSIGNALED(status))
 906       debug_printf("  signal exit, signal %d%s\n", WTERMSIG(status),
 907           WCOREDUMP(status) ? " (core dumped)" : "");
 908 #endif
 909     }
 910
 911   /* If it's a listening daemon for which we are keeping track of individual
 912   subprocesses, deal with an accepting process that has terminated. */
 913
 914   if (smtp_slots)
 915     {
 916     int i;
 917     smtp_slot * sp;
 918     for (i = 0, sp = smtp_slots; i < smtp_accept_max; i++, sp++)
 919       if (sp->pid == pid)
 920         {
 921         if (sp->host_address)
 922           store_free(sp->host_address);
 923         *sp = empty_smtp_slot;
 924         if (--smtp_accept_count < 0) smtp_accept_count = 0;
 925         DEBUG(D_any) debug_printf("%d SMTP accept process%s now running\n",
 926           smtp_accept_count, smtp_accept_count == 1 ? "" : "es");
 927         break;
 928         }
 929     if (i < smtp_accept_max) continue;  /* Found an accepting process */
 930     }
 931
 932   /* If it wasn't an accepting process, see if it was a queue-runner
 933   process that we are tracking. */
 934
 935   if (queue_runner_slots)
 936     for (unsigned i = 0; i < queue_runner_slot_count; i++)
 937       {
 938       runner_slot * r = queue_runner_slots + i;
 939       if (r->pid == pid)
 940         {
 941         r->pid = 0;                     /* free up the slot */
 942
 943         if (--queue_run_count < 0) queue_run_count = 0;
 944         DEBUG(D_any) debug_printf("%d queue-runner process%s now running\n",
 945           queue_run_count, queue_run_count == 1 ? "" : "es");
 946
 947         for (qrunner ** p = &qrunners, * q = qrunners; q; p = &q->next, q = *p)
 948           if (q->name == r->queue_name)
 949             {
 950             if (q->interval)            /* a periodic queue run */
 951               q->run_count--;
 952             else                        /* a one-time run */
 953               *p = q->next;             /* drop this qrunner */
 954             break;
 955             }
 956         break;
 957         }
 958       }
 959   }
 960 }
 961
 962
 963 static void
 964 set_pid_file_path(void)
 965 {
 966 if (override_pid_file_path)
 967   pid_file_path = override_pid_file_path;
 968
 969 if (!*pid_file_path)
 970   pid_file_path = string_sprintf("%s/exim-daemon.pid", spool_directory);
 971
 972 if (pid_file_path[0] != '/')
 973   log_write(0, LOG_PANIC_DIE, "pid file path %s must be absolute\n", pid_file_path);
 974 }
 975
 976
 977 enum pid_op { PID_WRITE, PID_CHECK, PID_DELETE };
 978
 979 /* Do various pid file operations as safe as possible. Ideally we'd just
 980 drop the privileges for creation of the pid file and not care at all about removal of
 981 the file. FIXME.
 982 Returns: true on success, false + errno==EACCES otherwise
 983 */
 984
 985 static BOOL
 986 operate_on_pid_file(const enum pid_op operation, const pid_t pid)
 987 {
 988 char pid_line[sizeof(int) * 3 + 2];
 989 const int pid_len = snprintf(pid_line, sizeof(pid_line), "%ld\n", (long)pid);
 990 BOOL lines_match = FALSE;
 991 uschar * path, * base, * dir;
 992
 993 const int dir_flags = O_RDONLY | O_NONBLOCK;
 994 const int base_flags = O_NOFOLLOW | O_NONBLOCK;
 995 const mode_t base_mode = 0644;
 996 struct stat sb;
 997 int cwd_fd = -1, dir_fd = -1, base_fd = -1;
 998 BOOL success = FALSE;
 999 errno = EACCES;
1000
1001 set_pid_file_path();
1002 if (!f.running_in_test_harness && real_uid != root_uid && real_uid != exim_uid) goto cleanup;
1003 if (pid_len < 2 || pid_len >= (int)sizeof(pid_line)) goto cleanup;
1004
1005 path = string_copy(pid_file_path);
1006 if ((base = Ustrrchr(path, '/')) == NULL)       /* should not happen, but who knows */
1007   log_write(0, LOG_MAIN|LOG_PANIC_DIE, "pid file path \"%s\" does not contain a '/'", pid_file_path);
1008
1009 dir = base != path ? path : US"/";
1010 *base++ = '\0';
1011
1012 if (!dir || !*dir || *dir != '/') goto cleanup;
1013 if (!base || !*base || Ustrchr(base, '/') != NULL) goto cleanup;
1014
1015 cwd_fd = open(".", dir_flags);
1016 if (cwd_fd < 0 || fstat(cwd_fd, &sb) != 0 || !S_ISDIR(sb.st_mode)) goto cleanup;
1017 dir_fd = open(CS dir, dir_flags);
1018 if (dir_fd < 0 || fstat(dir_fd, &sb) != 0 || !S_ISDIR(sb.st_mode)) goto cleanup;
1019
1020 /* emulate openat */
1021 if (fchdir(dir_fd) != 0) goto cleanup;
1022 base_fd = open(CS base, O_RDONLY | base_flags);
1023 if (fchdir(cwd_fd) != 0)
1024   log_write(0, LOG_MAIN|LOG_PANIC_DIE, "can't return to previous working dir: %s", strerror(errno));
1025
1026 if (base_fd >= 0)
1027   {
1028   char line[sizeof(pid_line)];
1029   ssize_t len = -1;
1030
1031   if (fstat(base_fd, &sb) != 0 || !S_ISREG(sb.st_mode)) goto cleanup;
1032   if ((sb.st_mode & 07777) != base_mode || sb.st_nlink != 1) goto cleanup;
1033   if (sb.st_size < 2 || sb.st_size >= (off_t)sizeof(line)) goto cleanup;
1034
1035   len = read(base_fd, line, sizeof(line));
1036   if (len != (ssize_t)sb.st_size) goto cleanup;
1037   line[len] = '\0';
1038
1039   if (strspn(line, "0123456789") != (size_t)len-1) goto cleanup;
1040   if (line[len-1] != '\n') goto cleanup;
1041   lines_match = len == pid_len && strcmp(line, pid_line) == 0;
1042   }
1043
1044 if (operation == PID_WRITE)
1045   {
1046   if (!lines_match)
1047     {
1048     if (base_fd >= 0)
1049       {
1050       int error = -1;
1051       /* emulate unlinkat */
1052       if (fchdir(dir_fd) != 0) goto cleanup;
1053       error = unlink(CS base);
1054       if (fchdir(cwd_fd) != 0)
1055         log_write(0, LOG_MAIN|LOG_PANIC_DIE, "can't return to previous working dir: %s", strerror(errno));
1056       if (error) goto cleanup;
1057       (void)close(base_fd);
1058       base_fd = -1;
1059      }
1060     /* emulate openat */
1061     if (fchdir(dir_fd) != 0) goto cleanup;
1062     base_fd = open(CS base, O_WRONLY | O_CREAT | O_EXCL | base_flags, base_mode);
1063     if (fchdir(cwd_fd) != 0)
1064         log_write(0, LOG_MAIN|LOG_PANIC_DIE, "can't return to previous working dir: %s", strerror(errno));
1065     if (base_fd < 0) goto cleanup;
1066     if (fchmod(base_fd, base_mode) != 0) goto cleanup;
1067     if (write(base_fd, pid_line, pid_len) != pid_len) goto cleanup;
1068     DEBUG(D_any) debug_printf("pid written to %s\n", pid_file_path);
1069     }
1070   }
1071 else
1072   {
1073   if (!lines_match) goto cleanup;
1074   if (operation == PID_DELETE)
1075     {
1076     int error = -1;
1077     /* emulate unlinkat */
1078     if (fchdir(dir_fd) != 0) goto cleanup;
1079     error = unlink(CS base);
1080     if (fchdir(cwd_fd) != 0)
1081         log_write(0, LOG_MAIN|LOG_PANIC_DIE, "can't return to previous working dir: %s", strerror(errno));
1082     if (error) goto cleanup;
1083     }
1084   }
1085
1086 success = TRUE;
1087 errno = 0;
1088
1089 cleanup:
1090 if (cwd_fd >= 0) (void)close(cwd_fd);
1091 if (dir_fd >= 0) (void)close(dir_fd);
1092 if (base_fd >= 0) (void)close(base_fd);
1093 return success;
1094 }
1095
1096
1097 /* Remove the daemon's pidfile.  Note: runs with root privilege,
1098 as a direct child of the daemon.  Does not return. */
1099
1100 void
1101 delete_pid_file(void)
1102 {
1103 const BOOL success = operate_on_pid_file(PID_DELETE, getppid());
1104
1105 DEBUG(D_any)
1106   debug_printf("delete pid file %s %s: %s\n", pid_file_path,
1107     success ? "success" : "failure", strerror(errno));
1108
1109 exim_exit(EXIT_SUCCESS);
1110 }
1111
1112
1113 /* Called by the daemon; exec a child to get the pid file deleted
1114 since we may require privs for the containing directory */
1115
1116 static void
1117 daemon_die(void)
1118 {
1119 pid_t pid;
1120
1121 DEBUG(D_any) debug_printf("SIGTERM/SIGINT seen\n");
1122 #if !defined(DISABLE_TLS) && (defined(EXIM_HAVE_INOTIFY) || defined(EXIM_HAVE_KEVENT))
1123 tls_watch_invalidate();
1124 #endif
1125
1126 if (daemon_notifier_fd >= 0)
1127   {
1128   close(daemon_notifier_fd);
1129   daemon_notifier_fd = -1;
1130   unlink_notifier_socket();
1131   }
1132
1133 if (f.running_in_test_harness || write_pid)
1134   {
1135   if ((pid = exim_fork(US"daemon-del-pidfile")) == 0)
1136     {
1137     if (override_pid_file_path)
1138       (void)child_exec_exim(CEE_EXEC_PANIC, FALSE, NULL, FALSE, 3,
1139         "-oP", override_pid_file_path, "-oPX");
1140     else
1141       (void)child_exec_exim(CEE_EXEC_PANIC, FALSE, NULL, FALSE, 1, "-oPX");
1142
1143     /* Control never returns here. */
1144     }
1145   if (pid > 0)
1146     child_close(pid, 1);
1147   }
1148 exim_exit(EXIT_SUCCESS);
1149 }
1150
1151
1152 /*************************************************
1153 *       Listener socket for local work prompts   *
1154 *************************************************/
1155
1156 ssize_t
1157 daemon_client_sockname(struct sockaddr_un * sup, uschar ** sname)
1158 {
1159 #ifdef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
1160 sup->sun_path[0] = 0;  /* Abstract local socket addr - Linux-specific? */
1161 return offsetof(struct sockaddr_un, sun_path) + 1
1162   + snprintf(sup->sun_path+1, sizeof(sup->sun_path)-1, "exim_%d", getpid());
1163 #else
1164 *sname = string_sprintf("%s/p_%d", spool_directory, getpid());
1165 return offsetof(struct sockaddr_un, sun_path)
1166   + snprintf(sup->sun_path, sizeof(sup->sun_path), "%s", CS *sname);
1167 #endif
1168 }
1169
1170 ssize_t
1171 daemon_notifier_sockname(struct sockaddr_un * sup)
1172 {
1173 GET_OPTION("notifier_socket");
1174 #ifdef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
1175 sup->sun_path[0] = 0;  /* Abstract local socket addr - Linux-specific? */
1176 return offsetof(struct sockaddr_un, sun_path) + 1
1177   + snprintf(sup->sun_path+1, sizeof(sup->sun_path)-1, "%s",
1178               CS expand_string(notifier_socket));
1179 #else
1180 notifier_socket_name = expand_string(notifier_socket);
1181 return offsetof(struct sockaddr_un, sun_path)
1182   + snprintf(sup->sun_path, sizeof(sup->sun_path), "%s",
1183               CS notifier_socket_name);
1184 #endif
1185 }
1186
1187
1188 static void
1189 daemon_notifier_socket(void)
1190 {
1191 int fd;
1192 const uschar * where;
1193 struct sockaddr_un sa_un = {.sun_family = AF_UNIX};
1194 ssize_t len;
1195
1196 if (!f.notifier_socket_en)
1197   {
1198   DEBUG(D_any) debug_printf("-oY used so not creating notifier socket\n");
1199   return;
1200   }
1201 if (override_local_interfaces && !override_pid_file_path)
1202   {
1203   DEBUG(D_any)
1204     debug_printf("-oX used without -oP so not creating notifier socket\n");
1205   return;
1206   }
1207 if (!notifier_socket || !*notifier_socket)
1208   {
1209   DEBUG(D_any) debug_printf("no name for notifier socket\n");
1210   return;
1211   }
1212
1213 DEBUG(D_any) debug_printf("creating notifier socket\n");
1214
1215 #ifdef SOCK_CLOEXEC
1216 if ((fd = socket(PF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC, 0)) < 0)
1217   { where = US"socket"; goto bad; }
1218 #else
1219 if ((fd = socket(PF_UNIX, SOCK_DGRAM, 0)) < 0)
1220   { where = US"socket"; goto bad; }
1221 (void)fcntl(fd, F_SETFD, fcntl(fd, F_GETFD) | FD_CLOEXEC);
1222 #endif
1223
1224 len = daemon_notifier_sockname(&sa_un);
1225
1226 #ifdef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
1227 DEBUG(D_any) debug_printf(" @%s\n", sa_un.sun_path+1);
1228 #else                   /* filesystem-visible and persistent; will neeed removal */
1229 DEBUG(D_any) debug_printf(" %s\n", sa_un.sun_path);
1230 #endif
1231
1232 if (bind(fd, (const struct sockaddr *)&sa_un, (socklen_t)len) < 0)
1233   { where = US"bind"; goto bad; }
1234
1235 #ifdef SO_PASSCRED              /* Linux */
1236 if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &on, sizeof(on)) < 0)
1237   { where = US"SO_PASSCRED"; goto bad2; }
1238 #elif defined(LOCAL_CREDS)      /* FreeBSD-ish */
1239 if (setsockopt(fd, 0, LOCAL_CREDS, &on, sizeof(on)) < 0)
1240   { where = US"LOCAL_CREDS"; goto bad2; }
1241 #endif
1242
1243 /* debug_printf("%s: fd %d\n", __FUNCTION__, fd); */
1244 daemon_notifier_fd = fd;
1245 return;
1246
1247 bad2:
1248 #ifndef EXIM_HAVE_ABSTRACT_UNIX_SOCKETS
1249   Uunlink(sa_un.sun_path);
1250 #endif
1251 bad:
1252   log_write(0, LOG_MAIN|LOG_PANIC, "%s %s: %s",
1253     __FUNCTION__, where, strerror(errno));
1254   close(fd);
1255   return;
1256 }
1257
1258
1259 /* Data for notifier-triggered queue runs */
1260
1261 static uschar queuerun_msgid[MESSAGE_ID_LENGTH+1];
1262 static const uschar * queuerun_msg_qname;
1263
1264
1265 /* The notifier socket has something to read. Pull the message from it, decode
1266 and do the action.
1267 */
1268
1269 static void
1270 daemon_notification(void)
1271 {
1272 uschar buf[256], cbuf[256];
1273 struct sockaddr_un sa_un;
1274 struct iovec iov = {.iov_base = buf, .iov_len = sizeof(buf)-1};
1275 struct msghdr msg = { .msg_name = &sa_un,
1276                       .msg_namelen = sizeof(sa_un),
1277                       .msg_iov = &iov,
1278                       .msg_iovlen = 1,
1279                       .msg_control = cbuf,
1280                       .msg_controllen = sizeof(cbuf)
1281                     };
1282 ssize_t sz;
1283
1284 buf[sizeof(buf)-1] = 0;
1285 if ((sz = recvmsg(daemon_notifier_fd, &msg, 0)) <= 0) return;
1286 if (sz >= sizeof(buf)) return;
1287
1288 #ifdef notdef
1289 debug_printf("addrlen %d\n", msg.msg_namelen);
1290 #endif
1291 DEBUG(D_queue_run)
1292   if (msg.msg_namelen > 0)
1293     {
1294     BOOL abstract = !*sa_un.sun_path;
1295     char * name = sa_un.sun_path + (abstract ? 1 : 0);
1296     int namelen =  (int)msg.msg_namelen - abstract ? 1 : 0;
1297     if (*name)
1298       debug_printf("%s from addr '%s%.*s'\n", __FUNCTION__,
1299         abstract ? "@" : "",
1300         namelen, name);
1301     else
1302       debug_printf("%s (from unknown addr)\n", __FUNCTION__);
1303     }
1304   else
1305     debug_printf("%s (from unknown addr)\n", __FUNCTION__);
1306
1307 /* Refuse to handle the item unless the peer has good credentials */
1308 #ifdef SCM_CREDENTIALS
1309 # define EXIM_SCM_CR_TYPE SCM_CREDENTIALS
1310 #elif defined(LOCAL_CREDS) && defined(SCM_CREDS)
1311 # define EXIM_SCM_CR_TYPE SCM_CREDS
1312 #else
1313         /* The OS has no way to get the creds of the caller (for a unix/datagram socket.
1314         Punt; don't try to check. */
1315 #endif
1316
1317 #ifdef EXIM_SCM_CR_TYPE
1318 for (struct cmsghdr * cp = CMSG_FIRSTHDR(&msg);
1319      cp;
1320      cp = CMSG_NXTHDR(&msg, cp))
1321   if (cp->cmsg_level == SOL_SOCKET && cp->cmsg_type == EXIM_SCM_CR_TYPE)
1322   {
1323 # ifdef SCM_CREDENTIALS                                 /* Linux */
1324   struct ucred * cr = (struct ucred *) CMSG_DATA(cp);
1325   if (cr->uid && cr->uid != exim_uid)
1326     {
1327     DEBUG(D_queue_run) debug_printf("%s: sender creds pid %ld uid %d gid %d\n",
1328       __FUNCTION__, (long)cr->pid, (int)cr->uid, (int)cr->gid);
1329     }
1330 # elif defined(LOCAL_CREDS)                             /* BSD-ish */
1331   struct sockcred * cr = (struct sockcred *) CMSG_DATA(cp);
1332   if (cr->sc_uid && cr->sc_uid != exim_uid)
1333     {
1334     DEBUG(D_queue_run) debug_printf("%s: sender creds pid ??? uid %d gid %d\n",
1335       __FUNCTION__, (int)cr->sc_uid, (int)cr->sc_gid);
1336     }
1337 # endif
1338   break;
1339   }
1340 #endif
1341
1342 buf[sz] = 0;
1343 switch (buf[0])
1344   {
1345 #ifndef DISABLE_QUEUE_RAMP
1346   case NOTIFY_MSG_QRUN:
1347     /* this should be a message_id */
1348     DEBUG(D_queue_run)
1349       debug_printf("%s: qrunner trigger: %s\n", __FUNCTION__, buf+1);
1350
1351     memcpy(queuerun_msgid, buf+1, MESSAGE_ID_LENGTH+1);
1352
1353     for (qrunner * q = qrunners; q; q = q->next)
1354       if (q->name
1355           ? Ustrcmp(q->name, buf+1+MESSAGE_ID_LENGTH+1) == 0
1356           : !buf[1+MESSAGE_ID_LENGTH+1]
1357          )
1358         { queuerun_msg_qname = q->name; break; }
1359     return;
1360 #endif
1361
1362   case NOTIFY_QUEUE_SIZE_REQ:
1363     {
1364     uschar buf[16];
1365     int len = snprintf(CS buf, sizeof(buf), "%u", queue_count_cached());
1366
1367     DEBUG(D_queue_run)
1368       debug_printf("%s: queue size request: %s\n", __FUNCTION__, buf);
1369
1370     if (sendto(daemon_notifier_fd, buf, len, 0,
1371                 (const struct sockaddr *)&sa_un, msg.msg_namelen) < 0)
1372       log_write(0, LOG_MAIN|LOG_PANIC,
1373         "%s: sendto: %s\n", __FUNCTION__, strerror(errno));
1374     break;
1375     }
1376
1377   case NOTIFY_REGEX:
1378     regex_at_daemon(buf);
1379     break;
1380   }
1381 return;
1382 }
1383
1384
1385
1386 static void
1387 daemon_inetd_wtimeout(time_t last_connection_time)
1388 {
1389 time_t resignal_interval = inetd_wait_timeout;
1390
1391 if (last_connection_time == (time_t)0)
1392   {
1393   DEBUG(D_any)
1394     debug_printf("inetd wait timeout expired, but still not seen first message, ignoring\n");
1395   }
1396 else
1397   {
1398   time_t now = time(NULL);
1399   if (now == (time_t)-1)
1400     {
1401     DEBUG(D_any) debug_printf("failed to get time: %s\n", strerror(errno));
1402     }
1403   else if ((now - last_connection_time) >= inetd_wait_timeout)
1404     {
1405     DEBUG(D_any)
1406       debug_printf("inetd wait timeout %d expired, ending daemon\n",
1407           inetd_wait_timeout);
1408     log_write(0, LOG_MAIN, "exim %s daemon terminating, inetd wait timeout reached.\n",
1409         version_string);
1410     daemon_die();               /* Does not return */
1411     }
1412   else
1413     resignal_interval -= (now - last_connection_time);
1414   }
1415
1416 sigalrm_seen = FALSE;
1417 ALARM(resignal_interval);
1418 }
1419
1420
1421 /* Re-sort the qrunners list, and return the shortest interval.
1422 That could be negatime.
1423 The next-tick times should have been updated by any runs initiated,
1424 though will not be when the global limit on runners was reached.
1425
1426 Unlikely to have many queues, so insertion-sort.
1427 */
1428
1429 static int
1430 next_qrunner_interval(void)
1431 {
1432 qrunner * sorted = NULL;
1433 for (qrunner * q = qrunners, * next; q; q = next)
1434   {
1435   next = q->next;
1436   q->next = NULL;
1437   if (sorted)
1438     {
1439     qrunner ** p = &sorted;
1440     for (qrunner * qq; qq = *p; p = &qq->next)
1441       if (  q->next_tick < qq->next_tick
1442          || q->next_tick == qq->next_tick && q->interval < qq->interval
1443          )
1444         {
1445         *p = q;
1446         q->next = qq;
1447         goto INSERTED;
1448         }
1449     *p = q;
1450   INSERTED: ;
1451     }
1452   else
1453     sorted = q;
1454   }
1455 qrunners = sorted;
1456 return qrunners ? qrunners->next_tick - time(NULL) : 0;
1457 }
1458
1459 /* See if we can do a queue run.  If policy limit permit, kick one off.
1460 If both notification and timer events are present, handle the former
1461 and leave the timer outstanding.
1462
1463 Return the number of seconds until the next due runner.
1464 */
1465
1466 static int
1467 daemon_qrun(int local_queue_run_max, struct pollfd * fd_polls, int listen_socket_count)
1468 {
1469 DEBUG(D_any) debug_printf("%s received\n",
1470 #ifndef DISABLE_QUEUE_RAMP
1471   *queuerun_msgid ? "qrun notification" :
1472 #endif
1473   "SIGALRM");
1474
1475 /* Do a full queue run in a child process, if required, unless we already have
1476 enough queue runners on the go. If we are not running as root, a re-exec is
1477 required. In the calling process, restart the alamr timer for the next run.  */
1478
1479 if (is_multiple_qrun())                         /* we are managing periodic runs */
1480   if (local_queue_run_max <= 0 || queue_run_count < local_queue_run_max)
1481     {
1482     qrunner * q = NULL;
1483
1484 #ifndef DISABLE_QUEUE_RAMP
1485     /* If this is a triggered run for a specific message, see if we can start
1486     another runner for this queue. */
1487
1488     if (*queuerun_msgid)
1489       {
1490       for (qrunner * qq = qrunners; qq; qq = qq->next)
1491         if (qq->name == queuerun_msg_qname)
1492           {
1493           q = qq->run_count < qq->run_max ? qq : NULL;
1494           break;
1495           }
1496       }
1497     else
1498 #endif
1499       /* Normal periodic run: in order of run priority, find the first queue
1500       for which we can start a runner */
1501
1502       for (q = qrunners; q; q = q->next)
1503         if (q->run_count < q->run_max) break;
1504
1505     if (q)                                      /* found a queue to run */
1506       {
1507       pid_t pid;
1508
1509       /* Bump this queue's next-tick by it's interval */
1510
1511       if (q->interval)
1512         {
1513         time_t now = time(NULL);
1514         do ; while ((q->next_tick += q->interval) <= now);
1515         }
1516
1517       if ((pid = exim_fork(US"queue-runner")) == 0)
1518         {
1519         /* Disable debugging if it's required only for the daemon process. We
1520         leave the above message, because it ties up with the "child ended"
1521         debugging messages. */
1522
1523         if (f.debug_daemon) debug_selector = 0;
1524
1525         /* Close any open listening sockets in the child */
1526
1527         close_daemon_sockets(daemon_notifier_fd,
1528           fd_polls, listen_socket_count);
1529
1530         /* Reset SIGHUP and SIGCHLD in the child in both cases. */
1531
1532         signal(SIGHUP,  SIG_DFL);
1533         signal(SIGCHLD, SIG_DFL);
1534         signal(SIGTERM, SIG_DFL);
1535         signal(SIGINT, SIG_DFL);
1536
1537         /* Re-exec if privilege has been given up, unless deliver_drop_
1538         privilege is set. Reset SIGALRM before exec(). */
1539
1540         if (geteuid() != root_uid && !deliver_drop_privilege)
1541           {
1542           uschar opt[8];
1543           uschar *p = opt;
1544           uschar *extra[7];
1545           int extracount = 1;
1546
1547           signal(SIGALRM, SIG_DFL);
1548           queue_name = US"";
1549
1550           *p++ = '-';
1551           *p++ = 'q';
1552           if (  q->queue_2stage
1553 #ifndef DISABLE_QUEUE_RAMP
1554              && !*queuerun_msgid
1555 #endif
1556              ) *p++ = 'q';
1557           if (q->queue_run_first_delivery) *p++ = 'i';
1558           if (q->queue_run_force) *p++ = 'f';
1559           if (q->deliver_force_thaw) *p++ = 'f';
1560           if (q->queue_run_local) *p++ = 'l';
1561           *p = 0;
1562
1563           extra[0] = q->name
1564             ? string_sprintf("%sG%s", opt, q->name) : opt;
1565
1566 #ifndef DISABLE_QUEUE_RAMP
1567           if (*queuerun_msgid)
1568             {
1569             log_write(0, LOG_MAIN, "notify triggered queue run");
1570             extra[extracount++] = queuerun_msgid;       /* Trigger only the */
1571             extra[extracount++] = queuerun_msgid;       /* one message      */
1572             }
1573 #endif
1574
1575           /* If -R or -S were on the original command line, ensure they get
1576           passed on. */
1577
1578           if (deliver_selectstring)
1579             {
1580             extra[extracount++] = f.deliver_selectstring_regex ? US"-Rr" : US"-R";
1581             extra[extracount++] = deliver_selectstring;
1582             }
1583
1584           if (deliver_selectstring_sender)
1585             {
1586             extra[extracount++] = f.deliver_selectstring_sender_regex
1587               ? US"-Sr" : US"-S";
1588             extra[extracount++] = deliver_selectstring_sender;
1589             }
1590
1591           /* Overlay this process with a new execution. */
1592
1593           (void)child_exec_exim(CEE_EXEC_PANIC, FALSE, NULL, FALSE, extracount,
1594             extra[0], extra[1], extra[2], extra[3], extra[4], extra[5], extra[6]);
1595
1596           /* Control never returns here. */
1597           }
1598
1599         /* No need to re-exec; SIGALRM remains set to the default handler */
1600
1601 #ifndef DISABLE_QUEUE_RAMP
1602         if (*queuerun_msgid)
1603           {
1604           log_write(0, LOG_MAIN, "notify triggered queue run");
1605           f.queue_2stage = FALSE;
1606           queue_run(q, queuerun_msgid, queuerun_msgid, FALSE);
1607           }
1608         else
1609 #endif
1610           queue_run(q, NULL, NULL, FALSE);
1611         exim_underbar_exit(EXIT_SUCCESS);
1612         }
1613
1614       if (pid < 0)
1615         {
1616         log_write(0, LOG_MAIN|LOG_PANIC, "daemon: fork of queue-runner "
1617           "process failed: %s", strerror(errno));
1618         log_close_all();
1619         }
1620       else
1621         {
1622         for (int i = 0; i < local_queue_run_max; ++i)
1623           if (queue_runner_slots[i].pid <= 0)
1624             {
1625             queue_runner_slots[i].pid = pid;
1626             queue_runner_slots[i].queue_name = q->name;
1627             q->run_count++;
1628             queue_run_count++;
1629             break;
1630             }
1631         DEBUG(D_any) debug_printf("%d queue-runner process%s running\n",
1632           queue_run_count, queue_run_count == 1 ? "" : "es");
1633         }
1634       }
1635     }
1636
1637 /* The queue run has been initiated (unless we were already running enough) */
1638
1639 #ifndef DISABLE_QUEUE_RAMP
1640 if (*queuerun_msgid)            /* it was a fast-ramp kick; dealt with */
1641   *queuerun_msgid = 0;
1642 else                            /* periodic or one-time queue run */
1643 #endif
1644   /* Set up next timer callback. Impose a minimum 1s tick,
1645   even when a run was outstanding */
1646   {
1647   int interval = next_qrunner_interval();
1648   if (interval <= 0) interval = 1;
1649
1650   sigalrm_seen = FALSE;
1651   if (qrunners)                 /* there are still periodic qrunners */
1652     {
1653     ALARM(interval);            /* set up next qrun tick */
1654     return interval;
1655     }
1656   }
1657 return 0;
1658 }
1659
1660
1661
1662
1663 static const uschar *
1664 describe_queue_runners(void)
1665 {
1666 gstring * g = NULL;
1667
1668 if (!is_multiple_qrun()) return US"no queue runs";
1669
1670 for (qrunner * q = qrunners; q; q = q->next)
1671   {
1672   g = string_catn(g, US"-q", 2);
1673   if (q->queue_2stage) g = string_catn(g, US"q", 1);
1674   if (q->name) g = string_append(g, 3, US"G", q->name, US"/");
1675   g = string_cat(g, readconf_printtime(q->interval));
1676   g = string_catn(g, US" ", 1);
1677   }
1678 gstring_trim(g, 1);
1679 gstring_release_unused(g);
1680 return string_from_gstring(g);
1681 }
1682
1683
1684 /*************************************************
1685 *              Exim Daemon Mainline              *
1686 *************************************************/
1687
1688 /* The daemon can do two jobs, either of which is optional:
1689
1690 (1) Listens for incoming SMTP calls and spawns off a sub-process to handle
1691 each one. This is requested by the -bd option, with -oX specifying the SMTP
1692 port on which to listen (for testing).
1693
1694 (2) Spawns a queue-running process every so often. This is controlled by the
1695 -q option with a an interval time. (If no time is given, a single queue run
1696 is done from the main function, and control doesn't get here.)
1697
1698 Root privilege is required in order to attach to port 25. Some systems require
1699 it when calling socket() rather than bind(). To cope with all cases, we run as
1700 root for both socket() and bind(). Some systems also require root in order to
1701 write to the pid file directory. This function must therefore be called as root
1702 if it is to work properly in all circumstances. Once the socket is bound and
1703 the pid file written, root privilege is given up if there is an exim uid.
1704
1705 There are no arguments to this function, and it never returns. */
1706
1707 void
1708 daemon_go(void)
1709 {
1710 struct passwd * pw;
1711 struct pollfd * fd_polls, * tls_watch_poll = NULL, * dnotify_poll = NULL;
1712 int listen_socket_count = 0, poll_fd_count;
1713 ip_address_item * addresses = NULL;
1714 time_t last_connection_time = (time_t)0;
1715 int local_queue_run_max = 0;
1716
1717 if (is_multiple_qrun())
1718   {
1719   /* Nuber of runner-tracking structs needed:  If the option queue_run_max has
1720   no expandable elements then it is the overall maximum; else we assume it
1721   depends on the queue name, and add them up to get the maximum.
1722   Evaluate both that and the individual limits. */
1723
1724   GET_OPTION("queue_run_max");
1725   if (Ustrchr(queue_run_max, '$') != NULL)
1726     {
1727     for (qrunner * q = qrunners; q; q = q->next)
1728       {
1729       queue_name = q->name;
1730       local_queue_run_max +=
1731         (q->run_max = atoi(CS expand_string(queue_run_max)));
1732       }
1733     queue_name = US"";
1734     }
1735   else
1736     {
1737     local_queue_run_max = atoi(CS expand_string(queue_run_max));
1738     for (qrunner * q = qrunners; q; q = q->next)
1739       q->run_max = local_queue_run_max;
1740     }
1741   }
1742
1743 process_purpose = US"daemon";
1744
1745 /* If any debugging options are set, turn on the D_pid bit so that all
1746 debugging lines get the pid added. */
1747
1748 DEBUG(D_any|D_v) debug_selector |= D_pid;
1749
1750 /* Allocate enough pollstructs for inetd mode plus the ancillary sockets;
1751 also used when there are no listen sockets. */
1752
1753 fd_polls = store_get(sizeof(struct pollfd) * 3, GET_UNTAINTED);
1754
1755 if (f.inetd_wait_mode)
1756   {
1757   listen_socket_count = 1;
1758   (void) close(3);
1759   if (dup2(0, 3) == -1)
1760     log_write(0, LOG_MAIN|LOG_PANIC_DIE,
1761         "failed to dup inetd socket safely away: %s", strerror(errno));
1762
1763   fd_polls[0].fd = 3;
1764   fd_polls[0].events = POLLIN;
1765   (void) close(0);
1766   (void) close(1);
1767   (void) close(2);
1768   exim_nullstd();
1769
1770   if (debug_file == stderr)
1771     {
1772     /* need a call to log_write before call to open debug_file, so that
1773     log.c:file_path has been initialised.  This is unfortunate. */
1774     log_write(0, LOG_MAIN, "debugging Exim in inetd wait mode starting");
1775
1776     fclose(debug_file);
1777     debug_file = NULL;
1778     exim_nullstd(); /* re-open fd2 after we just closed it again */
1779     debug_logging_activate(US"-wait", NULL);
1780     }
1781
1782   DEBUG(D_any) debug_printf("running in inetd wait mode\n");
1783
1784   /* As per below, when creating sockets ourselves, we handle tcp_nodelay for
1785   our own buffering; we assume though that inetd set the socket REUSEADDR. */
1786
1787   if (tcp_nodelay)
1788     if (setsockopt(3, IPPROTO_TCP, TCP_NODELAY, US &on, sizeof(on)))
1789       log_write(0, LOG_MAIN|LOG_PANIC_DIE, "failed to set socket NODELAY: %s",
1790         strerror(errno));
1791   }
1792
1793
1794 if (f.inetd_wait_mode || f.daemon_listen)
1795   {
1796   /* If any option requiring a load average to be available during the
1797   reception of a message is set, call os_getloadavg() while we are root
1798   for those OS for which this is necessary the first time it is called (in
1799   order to perform an "open" on the kernel memory file). */
1800
1801 #ifdef LOAD_AVG_NEEDS_ROOT
1802   if (queue_only_load >= 0 || smtp_load_reserve >= 0 ||
1803        (deliver_queue_load_max >= 0 && deliver_drop_privilege))
1804     (void)os_getloadavg();
1805 #endif
1806   }
1807
1808
1809 /* Do the preparation for setting up a listener on one or more interfaces, and
1810 possible on various ports. This is controlled by the combination of
1811 local_interfaces (which can set IP addresses and ports) and daemon_smtp_port
1812 (which is a list of default ports to use for those items in local_interfaces
1813 that do not specify a port). The -oX command line option can be used to
1814 override one or both of these options.
1815
1816 If local_interfaces is not set, the default is to listen on all interfaces.
1817 When it is set, it can include "all IPvx interfaces" as an item. This is useful
1818 when different ports are in use.
1819
1820 It turns out that listening on all interfaces is messy in an IPv6 world,
1821 because several different implementation approaches have been taken. This code
1822 is now supposed to work with all of them. The point of difference is whether an
1823 IPv6 socket that is listening on all interfaces will receive incoming IPv4
1824 calls or not. We also have to cope with the case when IPv6 libraries exist, but
1825 there is no IPv6 support in the kernel.
1826
1827 . On Solaris, an IPv6 socket will accept IPv4 calls, and give them as mapped
1828   addresses. However, if an IPv4 socket is also listening on all interfaces,
1829   calls are directed to the appropriate socket.
1830
1831 . On (some versions of) Linux, an IPv6 socket will accept IPv4 calls, and
1832   give them as mapped addresses, but an attempt also to listen on an IPv4
1833   socket on all interfaces causes an error.
1834
1835 . On OpenBSD, an IPv6 socket will not accept IPv4 calls. You have to set up
1836   two sockets if you want to accept both kinds of call.
1837
1838 . FreeBSD is like OpenBSD, but it has the IPV6_V6ONLY socket option, which
1839   can be turned off, to make it behave like the versions of Linux described
1840   above.
1841
1842 . I heard a report that the USAGI IPv6 stack for Linux has implemented
1843   IPV6_V6ONLY.
1844
1845 So, what we do when IPv6 is supported is as follows:
1846
1847  (1) After it is set up, the list of interfaces is scanned for wildcard
1848      addresses. If an IPv6 and an IPv4 wildcard are both found for the same
1849      port, the list is re-arranged so that they are together, with the IPv6
1850      wildcard first.
1851
1852  (2) If the creation of a wildcard IPv6 socket fails, we just log the error and
1853      carry on if an IPv4 wildcard socket for the same port follows later in the
1854      list. This allows Exim to carry on in the case when the kernel has no IPv6
1855      support.
1856
1857  (3) Having created an IPv6 wildcard socket, we try to set IPV6_V6ONLY if that
1858      option is defined. However, if setting fails, carry on regardless (but log
1859      the incident).
1860
1861  (4) If binding or listening on an IPv6 wildcard socket fails, it is a serious
1862      error.
1863
1864  (5) If binding or listening on an IPv4 wildcard socket fails with the error
1865      EADDRINUSE, and a previous interface was an IPv6 wildcard for the same
1866      port (which must have succeeded or we wouldn't have got this far), we
1867      assume we are in the situation where just a single socket is permitted,
1868      and ignore the error.
1869
1870 Phew!
1871
1872 The preparation code decodes options and sets up the relevant data. We do this
1873 first, so that we can return non-zero if there are any syntax errors, and also
1874 write to stderr. */
1875
1876 if (f.daemon_listen && !f.inetd_wait_mode)
1877   {
1878   int * default_smtp_port;
1879   int pct = 0;
1880   uschar * s;
1881   const uschar * list;
1882   uschar * local_iface_source = US"local_interfaces";
1883   ip_address_item * ipa, ** pipa;
1884
1885   /* If -oX was used, disable the writing of a pid file unless -oP was
1886   explicitly used to force it. Then scan the string given to -oX. Any items
1887   that contain neither a dot nor a colon are used to override daemon_smtp_port.
1888   Any other items are used to override local_interfaces. */
1889
1890   if (override_local_interfaces)
1891     {
1892     gstring * new_smtp_port = NULL, * new_local_interfaces = NULL;
1893
1894     if (!override_pid_file_path) write_pid = FALSE;
1895
1896     /* specifically permit change-of-separator for admins (who should be
1897     the only people getting here, but we may as well be careful) */
1898
1899     list = f.admin_user
1900       ? string_copy_taint(override_local_interfaces, GET_UNTAINTED)
1901       : override_local_interfaces;
1902
1903     for (int sep = 0; s = string_nextinlist(&list, &sep, NULL, 0); )
1904       {
1905       uschar joinstr[4];
1906       gstring ** gp = Ustrpbrk(s, ".:") ? &new_local_interfaces : &new_smtp_port;
1907       if (!*gp)
1908         {
1909         joinstr[0] = sep;
1910         joinstr[1] = ' ';
1911         *gp = string_catn(NULL, US"<", 1);
1912         }
1913
1914       *gp = string_catn(*gp, joinstr, 2);
1915       *gp = string_cat (*gp, s);
1916       }
1917
1918     if (new_smtp_port)
1919       {
1920       daemon_smtp_port = string_from_gstring(new_smtp_port);
1921       DEBUG(D_any) debug_printf("daemon_smtp_port overridden by -oX:\n  %s\n",
1922         daemon_smtp_port);
1923       }
1924
1925     if (new_local_interfaces)
1926       {
1927       local_interfaces = string_from_gstring(new_local_interfaces);
1928       local_iface_source = US"-oX data";
1929       DEBUG(D_any) debug_printf("local_interfaces overridden by -oX:\n  %s\n",
1930         local_interfaces);
1931       }
1932     }
1933
1934   /* Create a list of default SMTP ports, to be used if local_interfaces
1935   contains entries without explicit ports. First count the number of ports, then
1936   build a translated list in a vector. */
1937
1938   list = daemon_smtp_port;
1939   for (int sep = 0; s = string_nextinlist(&list, &sep, NULL, 0); )
1940     pct++;
1941   default_smtp_port = store_get((pct+1) * sizeof(int), GET_UNTAINTED);
1942   list = daemon_smtp_port;
1943   pct= 0;
1944   for (int sep = 0; s = string_nextinlist(&list, &sep, NULL, 0); pct++)
1945     if (isdigit(*s))
1946       {
1947       uschar * end;
1948       default_smtp_port[pct] = Ustrtol(s, &end, 0);
1949       if (*end)
1950         log_write(0, LOG_PANIC_DIE|LOG_CONFIG, "invalid SMTP port: %s", s);
1951       }
1952     else
1953       {
1954       struct servent * smtp_service = getservbyname(CS s, "tcp");
1955       if (!smtp_service)
1956         log_write(0, LOG_PANIC_DIE|LOG_CONFIG, "TCP port \"%s\" not found", s);
1957       default_smtp_port[pct] = ntohs(smtp_service->s_port);
1958       }
1959   default_smtp_port[pct] = 0;
1960
1961   /* Check the list of TLS-on-connect ports and do name lookups if needed */
1962
1963   list = tls_in.on_connect_ports;
1964   /* the list isn't expanded so cannot be tainted.  If it ever is we will trap here */
1965   for (int sep = 0;
1966       s = string_nextinlist(&list, &sep, big_buffer, big_buffer_size); )
1967     if (!isdigit(*s))
1968       {
1969       gstring * g = NULL;
1970
1971       list = tls_in.on_connect_ports;
1972       tls_in.on_connect_ports = NULL;
1973       sep = 0;
1974       while ((s = string_nextinlist(&list, &sep, big_buffer, big_buffer_size)))
1975         if (isdigit(*s))
1976           g = string_append_listele(g, ':', s);
1977         else
1978           {
1979           struct servent * smtp_service = getservbyname(CS s, "tcp");
1980           if (!smtp_service)
1981             log_write(0, LOG_PANIC_DIE|LOG_CONFIG, "TCP port \"%s\" not found", s);
1982           g = string_append_listele_fmt(g, ':', FALSE, "%d",
1983                                               (int)ntohs(smtp_service->s_port));
1984           }
1985
1986       if (g)
1987         tls_in.on_connect_ports = g->s;
1988       break;
1989       }
1990
1991   /* Create the list of local interfaces, possibly with ports included. This
1992   list may contain references to 0.0.0.0 and ::0 as wildcards. These special
1993   values are converted below. */
1994
1995   addresses = host_build_ifacelist(local_interfaces, local_iface_source);
1996
1997   /* In the list of IP addresses, convert 0.0.0.0 into an empty string, and ::0
1998   into the string ":". We use these to recognize wildcards in IPv4 and IPv6. In
1999   fact, many IP stacks recognize 0.0.0.0 and ::0 and handle them as wildcards
2000   anyway, but we need to know which are the wildcard addresses, and the shorter
2001   strings are neater.
2002
2003   In the same scan, fill in missing port numbers from the default list. When
2004   there is more than one item in the list, extra items are created. */
2005
2006   for (ipa = addresses; ipa; ipa = ipa->next)
2007     {
2008     if (Ustrcmp(ipa->address, "0.0.0.0") == 0)
2009       ipa->address[0] = 0;
2010     else if (Ustrcmp(ipa->address, "::0") == 0)
2011       {
2012       ipa->address[0] = ':';
2013       ipa->address[1] = 0;
2014       }
2015
2016     if (ipa->port > 0) continue;
2017
2018     if (daemon_smtp_port[0] <= 0)
2019       log_write(0, LOG_MAIN|LOG_PANIC_DIE, "no port specified for interface "
2020         "%s and daemon_smtp_port is unset; cannot start daemon",
2021         ipa->address[0] == 0 ? US"\"all IPv4\"" :
2022         ipa->address[1] == 0 ? US"\"all IPv6\"" : ipa->address);
2023
2024     ipa->port = default_smtp_port[0];
2025     for (int i = 1; default_smtp_port[i] > 0; i++)
2026       {
2027       ip_address_item * new = store_get(sizeof(ip_address_item), GET_UNTAINTED);
2028
2029       memcpy(new->address, ipa->address, Ustrlen(ipa->address) + 1);
2030       new->port = default_smtp_port[i];
2031       new->next = ipa->next;
2032       ipa->next = new;
2033       ipa = new;
2034       }
2035     }
2036
2037   /* Scan the list of addresses for wildcards. If we find an IPv4 and an IPv6
2038   wildcard for the same port, ensure that (a) they are together and (b) the
2039   IPv6 address comes first. This makes handling the messy features easier, and
2040   also simplifies the construction of the "daemon started" log line. */
2041
2042   pipa = &addresses;
2043   for (ipa = addresses; ipa; pipa = &ipa->next, ipa = ipa->next)
2044     {
2045     ip_address_item *ipa2;
2046
2047     /* Handle an IPv4 wildcard */
2048
2049     if (ipa->address[0] == 0)
2050       for (ipa2 = ipa; ipa2->next; ipa2 = ipa2->next)
2051         {
2052         ip_address_item *ipa3 = ipa2->next;
2053         if (ipa3->address[0] == ':' &&
2054             ipa3->address[1] == 0 &&
2055             ipa3->port == ipa->port)
2056           {
2057           ipa2->next = ipa3->next;
2058           ipa3->next = ipa;
2059           *pipa = ipa3;
2060           break;
2061           }
2062         }
2063
2064     /* Handle an IPv6 wildcard. */
2065
2066     else if (ipa->address[0] == ':' && ipa->address[1] == 0)
2067       for (ipa2 = ipa; ipa2->next; ipa2 = ipa2->next)
2068         {
2069         ip_address_item *ipa3 = ipa2->next;
2070         if (ipa3->address[0] == 0 && ipa3->port == ipa->port)
2071           {
2072           ipa2->next = ipa3->next;
2073           ipa3->next = ipa->next;
2074           ipa->next = ipa3;
2075           ipa = ipa3;
2076           break;
2077           }
2078         }
2079     }
2080
2081   /* Get a vector to remember all the sockets in.
2082   Two extra elements for the ancillary sockets */
2083
2084   for (ipa = addresses; ipa; ipa = ipa->next)
2085     listen_socket_count++;
2086   fd_polls = store_get(sizeof(struct pollfd) * (listen_socket_count + 2),
2087                             GET_UNTAINTED);
2088   for (struct pollfd * p = fd_polls; p < fd_polls + listen_socket_count + 2;
2089        p++)
2090     { p->fd = -1; p->events = POLLIN; }
2091
2092   } /* daemon_listen but not inetd_wait_mode */
2093
2094 if (f.daemon_listen)
2095   {
2096
2097   /* Do a sanity check on the max connects value just to save us from getting
2098   a huge amount of store. */
2099
2100   if (smtp_accept_max > 4095) smtp_accept_max = 4096;
2101
2102   /* There's no point setting smtp_accept_queue unless it is less than the max
2103   connects limit. The configuration reader ensures that the max is set if the
2104   queue-only option is set. */
2105
2106   if (smtp_accept_queue > smtp_accept_max) smtp_accept_queue = 0;
2107
2108   /* Get somewhere to keep the list of SMTP accepting pids if we are keeping
2109   track of them for total number and queue/host limits. */
2110
2111   if (smtp_accept_max > 0)
2112     {
2113     smtp_slots = store_get(smtp_accept_max * sizeof(smtp_slot), GET_UNTAINTED);
2114     for (int i = 0; i < smtp_accept_max; i++) smtp_slots[i] = empty_smtp_slot;
2115     }
2116   }
2117
2118 /* The variable background_daemon is always false when debugging, but
2119 can also be forced false in order to keep a non-debugging daemon in the
2120 foreground. If background_daemon is true, close all open file descriptors that
2121 we know about, but then re-open stdin, stdout, and stderr to /dev/null.  Also
2122 do this for inetd_wait mode.
2123
2124 This is protection against any called functions (in libraries, or in
2125 Perl, or whatever) that think they can write to stderr (or stdout). Before this
2126 was added, it was quite likely that an SMTP connection would use one of these
2127 file descriptors, in which case writing random stuff to it caused chaos.
2128
2129 Then disconnect from the controlling terminal, Most modern Unixes seem to have
2130 setsid() for getting rid of the controlling terminal. For any OS that doesn't,
2131 setsid() can be #defined as a no-op, or as something else. */
2132
2133 if (f.background_daemon || f.inetd_wait_mode)
2134   {
2135   log_close_all();    /* Just in case anything was logged earlier */
2136   search_tidyup();    /* Just in case any were used in reading the config. */
2137   (void)close(0);           /* Get rid of stdin/stdout/stderr */
2138   (void)close(1);
2139   (void)close(2);
2140   exim_nullstd();     /* Connect stdin/stdout/stderr to /dev/null */
2141   log_stderr = NULL;  /* So no attempt to copy paniclog output */
2142   }
2143
2144 if (f.background_daemon)
2145   {
2146   /* If the parent process of this one has pid == 1, we are re-initializing the
2147   daemon as the result of a SIGHUP. In this case, there is no need to do
2148   anything, because the controlling terminal has long gone. Otherwise, fork, in
2149   case current process is a process group leader (see 'man setsid' for an
2150   explanation) before calling setsid().
2151   All other forks want daemon_listen cleared. Rather than blow a register, jsut
2152   restore it here. */
2153
2154   if (getppid() != 1)
2155     {
2156     BOOL daemon_listen = f.daemon_listen;
2157     pid_t pid = exim_fork(US"daemon");
2158     if (pid < 0) log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2159       "fork() failed when starting daemon: %s", strerror(errno));
2160     if (pid > 0) exim_exit(EXIT_SUCCESS); /* in parent process, just exit */
2161     (void)setsid();                       /* release controlling terminal */
2162     f.daemon_listen = daemon_listen;
2163     }
2164   }
2165
2166 /* We are now in the disconnected, daemon process (unless debugging). Set up
2167 the listening sockets if required. */
2168
2169 daemon_notifier_socket();
2170
2171 if (f.daemon_listen && !f.inetd_wait_mode)
2172   {
2173   int sk;
2174   ip_address_item *ipa;
2175
2176   /* For each IP address, create a socket, bind it to the appropriate port, and
2177   start listening. See comments above about IPv6 sockets that may or may not
2178   accept IPv4 calls when listening on all interfaces. We also have to cope with
2179   the case of a system with IPv6 libraries, but no IPv6 support in the kernel.
2180   listening, provided a wildcard IPv4 socket for the same port follows. */
2181
2182   for (ipa = addresses, sk = 0; sk < listen_socket_count; ipa = ipa->next, sk++)
2183     {
2184     BOOL wildcard;
2185     ip_address_item * ipa2;
2186     int fd, af;
2187
2188     if (Ustrchr(ipa->address, ':') != NULL)
2189       {
2190       af = AF_INET6;
2191       wildcard = ipa->address[1] == 0;
2192       }
2193     else
2194       {
2195       af = AF_INET;
2196       wildcard = ipa->address[0] == 0;
2197       }
2198
2199     if ((fd_polls[sk].fd = fd = ip_socket(SOCK_STREAM, af)) < 0)
2200       {
2201       if (check_special_case(0, addresses, ipa, FALSE))
2202         {
2203         log_write(0, LOG_MAIN, "Failed to create IPv6 socket for wildcard "
2204           "listening (%s): will use IPv4", strerror(errno));
2205         goto SKIP_SOCKET;
2206         }
2207       log_write(0, LOG_PANIC_DIE, "IPv%c socket creation failed: %s",
2208         af == AF_INET6 ? '6' : '4', strerror(errno));
2209       }
2210
2211     /* If this is an IPv6 wildcard socket, set IPV6_V6ONLY if that option is
2212     available. Just log failure (can get protocol not available, just like
2213     socket creation can). */
2214
2215 #ifdef IPV6_V6ONLY
2216     if (af == AF_INET6 && wildcard &&
2217         setsockopt(fd, IPPROTO_IPV6, IPV6_V6ONLY, &on, sizeof(on)) < 0)
2218       log_write(0, LOG_MAIN, "Setting IPV6_V6ONLY on daemon's IPv6 wildcard "
2219         "socket failed (%s): carrying on without it", strerror(errno));
2220 #endif  /* IPV6_V6ONLY */
2221
2222     /* Set SO_REUSEADDR so that the daemon can be restarted while a connection
2223     is being handled.  Without this, a connection will prevent reuse of the
2224     smtp port for listening. */
2225
2226     if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &on, sizeof(on)) < 0)
2227       log_write(0, LOG_MAIN|LOG_PANIC_DIE, "setting SO_REUSEADDR on socket "
2228         "failed when starting daemon: %s", strerror(errno));
2229
2230     /* Set TCP_NODELAY; Exim does its own buffering. There is a switch to
2231     disable this because it breaks some broken clients. */
2232
2233     if (tcp_nodelay) setsockopt(fd, IPPROTO_TCP, TCP_NODELAY, &on, sizeof(on));
2234
2235     /* Now bind the socket to the required port; if Exim is being restarted
2236     it may not always be possible to bind immediately, even with SO_REUSEADDR
2237     set, so try 10 times, waiting between each try. After 10 failures, we give
2238     up. In an IPv6 environment, if bind () fails with the error EADDRINUSE and
2239     we are doing wildcard IPv4 listening and there was a previous IPv6 wildcard
2240     address for the same port, ignore the error on the grounds that we must be
2241     in a system where the IPv6 socket accepts both kinds of call. This is
2242     necessary for (some release of) USAGI Linux; other IP stacks fail at the
2243     listen() stage instead. */
2244
2245 #ifdef TCP_FASTOPEN
2246     f.tcp_fastopen_ok = TRUE;
2247 #endif
2248     for(;;)
2249       {
2250       uschar *msg, *addr;
2251       if (ip_bind(fd, af, ipa->address, ipa->port) >= 0) break;
2252       if (check_special_case(errno, addresses, ipa, TRUE))
2253         {
2254         DEBUG(D_any) debug_printf("wildcard IPv4 bind() failed after IPv6 "
2255           "listen() success; EADDRINUSE ignored\n");
2256         (void)close(fd);
2257         goto SKIP_SOCKET;
2258         }
2259       msg = US strerror(errno);
2260       addr = wildcard
2261         ? af == AF_INET6
2262         ? US"(any IPv6)"
2263         : US"(any IPv4)"
2264         : ipa->address;
2265       if (daemon_startup_retries <= 0)
2266         log_write(0, LOG_MAIN|LOG_PANIC_DIE,
2267           "socket bind() to port %d for address %s failed: %s: "
2268           "daemon abandoned", ipa->port, addr, msg);
2269       log_write(0, LOG_MAIN, "socket bind() to port %d for address %s "
2270         "failed: %s: waiting %s before trying again (%d more %s)",
2271         ipa->port, addr, msg, readconf_printtime(daemon_startup_sleep),
2272         daemon_startup_retries, (daemon_startup_retries > 1)? "tries" : "try");
2273       daemon_startup_retries--;
2274       sleep(daemon_startup_sleep);
2275       }
2276
2277     DEBUG(D_any)
2278       if (wildcard)
2279         debug_printf("listening on all interfaces (IPv%c) port %d\n",
2280           af == AF_INET6 ? '6' : '4', ipa->port);
2281       else
2282         debug_printf("listening on %s port %d\n", ipa->address, ipa->port);
2283
2284     /* Start listening on the bound socket, establishing the maximum backlog of
2285     connections that is allowed. On success, add to the set of sockets for select
2286     and continue to the next address. */
2287
2288 #if defined(TCP_FASTOPEN) && !defined(__APPLE__)
2289     if (  f.tcp_fastopen_ok
2290        && setsockopt(fd, IPPROTO_TCP, TCP_FASTOPEN,
2291                     &smtp_connect_backlog, sizeof(smtp_connect_backlog)))
2292       {
2293       DEBUG(D_any) debug_printf("setsockopt FASTOPEN: %s\n", strerror(errno));
2294       f.tcp_fastopen_ok = FALSE;
2295       }
2296 #endif
2297     if (listen(fd, smtp_connect_backlog) >= 0)
2298       {
2299 #if defined(TCP_FASTOPEN) && defined(__APPLE__)
2300       if (  f.tcp_fastopen_ok
2301          && setsockopt(fd, IPPROTO_TCP, TCP_FASTOPEN, &on, sizeof(on)))
2302         {
2303         DEBUG(D_any) debug_printf("setsockopt FASTOPEN: %s\n", strerror(errno));
2304         f.tcp_fastopen_ok = FALSE;
2305         }
2306 #endif
2307       fd_polls[sk].fd = fd;
2308       continue;
2309       }
2310
2311     /* Listening has failed. In an IPv6 environment, as for bind(), if listen()
2312     fails with the error EADDRINUSE and we are doing IPv4 wildcard listening
2313     and there was a previous successful IPv6 wildcard listen on the same port,
2314     we want to ignore the error on the grounds that we must be in a system
2315     where the IPv6 socket accepts both kinds of call. */
2316
2317     if (!check_special_case(errno, addresses, ipa, TRUE))
2318       log_write(0, LOG_PANIC_DIE, "listen() failed on interface %s: %s",
2319         wildcard
2320         ? af == AF_INET6 ? US"(any IPv6)" : US"(any IPv4)" : ipa->address,
2321         strerror(errno));
2322
2323     DEBUG(D_any) debug_printf("wildcard IPv4 listen() failed after IPv6 "
2324       "listen() success; EADDRINUSE ignored\n");
2325     (void)close(fd);
2326
2327     /* Come here if there has been a problem with the socket which we
2328     are going to ignore. We remove the address from the chain, and back up the
2329     counts. */
2330
2331   SKIP_SOCKET:
2332     sk--;                          /* Back up the count */
2333     listen_socket_count--;         /* Reduce the total */
2334     if (ipa == addresses) addresses = ipa->next; else
2335       {
2336       for (ipa2 = addresses; ipa2->next != ipa; ipa2 = ipa2->next);
2337       ipa2->next = ipa->next;
2338       ipa = ipa2;
2339       }
2340     }          /* End of bind/listen loop for each address */
2341   }            /* End of setup for listening */
2342
2343
2344 /* If we are not listening, we want to write a pid file only if -oP was
2345 explicitly given. */
2346
2347 else if (!override_pid_file_path)
2348   write_pid = FALSE;
2349
2350 /* Write the pid to a known file for assistance in identification, if required.
2351 We do this before giving up root privilege, because on some systems it is
2352 necessary to be root in order to write into the pid file directory. There's
2353 nothing to stop multiple daemons running, as long as no more than one listens
2354 on a given TCP/IP port on the same interface(s). However, in these
2355 circumstances it gets far too complicated to mess with pid file names
2356 automatically. Consequently, Exim 4 writes a pid file only
2357
2358   (a) When running in the test harness, or
2359   (b) When -bd is used and -oX is not used, or
2360   (c) When -oP is used to supply a path.
2361
2362 The variable daemon_write_pid is used to control this. */
2363
2364 if (f.running_in_test_harness || write_pid)
2365   {
2366   const enum pid_op operation = (f.running_in_test_harness
2367      || real_uid == root_uid
2368      || (real_uid == exim_uid && !override_pid_file_path)) ? PID_WRITE : PID_CHECK;
2369   if (!operate_on_pid_file(operation, getpid()))
2370     DEBUG(D_any) debug_printf("%s pid file %s: %s\n", (operation == PID_WRITE) ? "write" : "check", pid_file_path, strerror(errno));
2371   }
2372
2373 /* Set up the handler for SIGHUP, which causes a restart of the daemon. */
2374
2375 sighup_seen = FALSE;
2376 signal(SIGHUP, sighup_handler);
2377
2378 /* Give up root privilege at this point (assuming that exim_uid and exim_gid
2379 are not root). The third argument controls the running of initgroups().
2380 Normally we do this, in order to set up the groups for the Exim user. However,
2381 if we are not root at this time - some odd installations run that way - we
2382 cannot do this. */
2383
2384 exim_setugid(exim_uid, exim_gid, geteuid()==root_uid, US"running as a daemon");
2385
2386 /* Update the originator_xxx fields so that received messages as listed as
2387 coming from Exim, not whoever started the daemon. */
2388
2389 originator_uid = exim_uid;
2390 originator_gid = exim_gid;
2391 originator_login = (pw = getpwuid(exim_uid))
2392   ? string_copy_perm(US pw->pw_name, FALSE) : US"exim";
2393
2394 /* Get somewhere to keep the list of queue-runner pids if we are keeping track
2395 of them (and also if we are doing queue runs). */
2396
2397 if (is_multiple_qrun() && local_queue_run_max > 0)
2398   {
2399   queue_runner_slot_count = local_queue_run_max;
2400   queue_runner_slots = store_get(local_queue_run_max * sizeof(runner_slot), GET_UNTAINTED);
2401   memset(queue_runner_slots, 0, local_queue_run_max * sizeof(runner_slot));
2402   }
2403
2404 /* Set up the handler for termination of child processes, and the one
2405 telling us to die. */
2406
2407 sigchld_seen = FALSE;
2408 os_non_restarting_signal(SIGCHLD, main_sigchld_handler);
2409
2410 sigterm_seen = FALSE;
2411 os_non_restarting_signal(SIGTERM, main_sigterm_handler);
2412 os_non_restarting_signal(SIGINT, main_sigterm_handler);
2413
2414 /* If we are to run the queue periodically, pretend the alarm has just gone
2415 off. This will cause the first queue-runner to get kicked off straight away.
2416 Get an initial sort of the list of queues, to prioritize the initial q-runs */
2417
2418
2419 if ((sigalrm_seen = is_multiple_qrun()))
2420   (void) next_qrunner_interval();
2421
2422 /* Log the start up of a daemon - at least one of listening or queue running
2423 must be set up. */
2424
2425 if (f.inetd_wait_mode)
2426   {
2427   uschar *p = big_buffer;
2428
2429   if (inetd_wait_timeout >= 0)
2430     sprintf(CS p, "terminating after %d seconds", inetd_wait_timeout);
2431   else
2432     sprintf(CS p, "with no wait timeout");
2433
2434   log_write(0, LOG_MAIN,
2435     "exim %s daemon started: pid=%ld, launched with listening socket, %s",
2436     version_string, getpid(), big_buffer);
2437   set_process_info("daemon(%s): pre-listening socket", version_string);
2438
2439   /* set up the timeout logic */
2440   sigalrm_seen = TRUE;
2441   }
2442
2443 else if (f.daemon_listen)
2444   {
2445   int smtp_ports = 0;
2446   int smtps_ports = 0;
2447   ip_address_item * ipa;
2448   uschar * p;
2449   const uschar * qinfo = describe_queue_runners();
2450
2451   /* Build a list of listening addresses in big_buffer, but limit it to 10
2452   items. The style is for backwards compatibility.
2453
2454   It is possible to have some ports listening for SMTPS (as opposed to TLS
2455   startted by STARTTLS), and others listening for standard SMTP. Keep their
2456   listings separate. */
2457
2458   for (int j = 0, i; j < 2; j++)
2459     for (i = 0, ipa = addresses; i < 10 && ipa; i++, ipa = ipa->next)
2460       {
2461       /* First time round, look for SMTP ports; second time round, look for
2462       SMTPS ports. Build IP+port strings. */
2463
2464       if (host_is_tls_on_connect_port(ipa->port) == (j > 0))
2465         {
2466         if (j == 0)
2467           smtp_ports++;
2468         else
2469           smtps_ports++;
2470
2471         /* Now the information about the port (and sometimes interface) */
2472
2473         if (ipa->address[0] == ':' && ipa->address[1] == 0)
2474           {                                             /* v6 wildcard */
2475           if (ipa->next && ipa->next->address[0] == 0 &&
2476               ipa->next->port == ipa->port)
2477             {
2478             ipa->log = string_sprintf(" port %d (IPv6 and IPv4)", ipa->port);
2479             (ipa = ipa->next)->log = NULL;
2480             }
2481           else if (ipa->v6_include_v4)
2482             ipa->log = string_sprintf(" port %d (IPv6 with IPv4)", ipa->port);
2483           else
2484             ipa->log = string_sprintf(" port %d (IPv6)", ipa->port);
2485           }
2486         else if (ipa->address[0] == 0)                  /* v4 wildcard */
2487           ipa->log = string_sprintf(" port %d (IPv4)", ipa->port);
2488         else                            /* check for previously-seen IP */
2489           {
2490           ip_address_item * i2;
2491           for (i2 = addresses; i2 != ipa; i2 = i2->next)
2492             if (  host_is_tls_on_connect_port(i2->port) == (j > 0)
2493                && Ustrcmp(ipa->address, i2->address) == 0
2494                )
2495               {                         /* found; append port to list */
2496               for (p = i2->log; *p; ) p++;      /* end of existing string   { */
2497               if (*--p == '}') *p = '\0';       /* drop EOL */
2498               while (isdigit(*--p)) ;           /* char before port */
2499
2500               i2->log = *p == ':'               /* no list yet?     { */
2501                 ? string_sprintf("%.*s{%s,%d}",
2502                   (int)(p - i2->log + 1), i2->log, p+1, ipa->port)
2503                 : string_sprintf("%s,%d}", i2->log, ipa->port);
2504               ipa->log = NULL;
2505               break;
2506               }
2507           if (i2 == ipa)                /* first-time IP */
2508             ipa->log = string_sprintf(" [%s]:%d", ipa->address, ipa->port);
2509           }
2510         }
2511       }
2512
2513   p = big_buffer;
2514   for (int j = 0, i; j < 2; j++)
2515     {
2516     /* First time round, look for SMTP ports; second time round, look for
2517     SMTPS ports. For the first one of each, insert leading text. */
2518
2519     if (j == 0)
2520       {
2521       if (smtp_ports > 0)
2522         p += sprintf(CS p, "SMTP on");
2523       }
2524     else
2525       if (smtps_ports > 0)
2526         p += sprintf(CS p, "%sSMTPS on",
2527           smtp_ports == 0 ? "" : " and for ");
2528
2529     /* Now the information about the port (and sometimes interface) */
2530
2531     for (i = 0, ipa = addresses; i < 10 && ipa; i++, ipa = ipa->next)
2532       if (host_is_tls_on_connect_port(ipa->port) == (j > 0))
2533         if (ipa->log)
2534           p += sprintf(CS p, "%s",  ipa->log);
2535
2536     if (ipa)
2537       p += sprintf(CS p, " ...");
2538     }
2539
2540   log_write(0, LOG_MAIN,
2541     "exim %s daemon started: pid=%ld, %s, listening for %s",
2542     version_string, getpid(), qinfo, big_buffer);
2543   set_process_info("daemon(%s): %s, listening for %s",
2544     version_string, qinfo, big_buffer);
2545   }
2546
2547 else    /* no listening sockets, only queue-runs */
2548   {
2549   const uschar * s = describe_queue_runners();
2550   log_write(0, LOG_MAIN,
2551     "exim %s daemon started: pid=%ld, %s, not listening for SMTP",
2552     version_string, getpid(), s);
2553   set_process_info("daemon(%s): %s, not listening", version_string, s);
2554   }
2555
2556 /* Do any work it might be useful to amortize over our children
2557 (eg: compile regex) */
2558
2559 dns_pattern_init();
2560 smtp_deliver_init();    /* Used for callouts */
2561
2562 #ifdef WITH_CONTENT_SCAN
2563 malware_init();
2564 #endif
2565 #ifndef DISABLE_TLS
2566 tls_daemon_init();
2567 #endif
2568
2569 /* Add ancillary sockets to the set for select */
2570
2571 poll_fd_count = listen_socket_count;
2572 #ifndef DISABLE_TLS
2573 if (tls_watch_fd >= 0)
2574   {
2575   tls_watch_poll = &fd_polls[poll_fd_count++];
2576   tls_watch_poll->fd = tls_watch_fd;
2577   tls_watch_poll->events = POLLIN;
2578   }
2579 #endif
2580 if (daemon_notifier_fd >= 0)
2581   {
2582   dnotify_poll = &fd_polls[poll_fd_count++];
2583   dnotify_poll->fd = daemon_notifier_fd;
2584   dnotify_poll->events = POLLIN;
2585   }
2586
2587 /* Close the log so it can be renamed and moved. In the few cases below where
2588 this long-running process writes to the log (always exceptional conditions), it
2589 closes the log afterwards, for the same reason. */
2590
2591 log_close_all();
2592
2593 DEBUG(D_any) debug_print_ids(US"daemon running with");
2594
2595 /* Any messages accepted via this route are going to be SMTP. */
2596
2597 smtp_input = TRUE;
2598
2599 #ifdef MEASURE_TIMING
2600 report_time_since(&timestamp_startup, US"daemon loop start");   /* testcase 0022 */
2601 #endif
2602
2603 /* Enter the never-ending loop... */
2604
2605 for (;;)
2606   {
2607   int nolisten_sleep = 60;
2608
2609   if (sigterm_seen)
2610     daemon_die();       /* Does not return */
2611
2612   /* This code is placed first in the loop, so that it gets obeyed at the
2613   start, before the first wait, for the queue-runner case, so that the first
2614   one can be started immediately.
2615
2616   The other option is that we have an inetd wait timeout specified to -bw. */
2617
2618   if (sigalrm_seen || *queuerun_msgid)
2619     if (inetd_wait_timeout > 0)
2620       daemon_inetd_wtimeout(last_connection_time);      /* Might not return */
2621     else
2622       nolisten_sleep =
2623         daemon_qrun(local_queue_run_max, fd_polls, listen_socket_count);
2624
2625
2626   /* Sleep till a connection happens if listening, and handle the connection if
2627   that is why we woke up. The FreeBSD operating system requires the use of
2628   select() before accept() because the latter function is not interrupted by
2629   a signal, and we want to wake up for SIGCHLD and SIGALRM signals. Some other
2630   OS do notice signals in accept() but it does no harm to have the select()
2631   in for all of them - and it won't then be a lurking problem for ports to
2632   new OS. In fact, the later addition of listening on specific interfaces only
2633   requires this way of working anyway. */
2634
2635   if (f.daemon_listen)
2636     {
2637     int lcount;
2638     BOOL select_failed = FALSE;
2639
2640     DEBUG(D_any) debug_printf("Listening...\n");
2641
2642     /* In rare cases we may have had a SIGCHLD signal in the time between
2643     setting the handler (below) and getting back here. If so, pretend that the
2644     select() was interrupted so that we reap the child. This might still leave
2645     a small window when a SIGCHLD could get lost. However, since we use SIGCHLD
2646     only to do the reaping more quickly, it shouldn't result in anything other
2647     than a delay until something else causes a wake-up.
2648     For the normal case, wait for either a pollable fd (eg. new connection) or
2649     or a SIGALRM (for a periodic queue run) */
2650
2651     if (sigchld_seen)
2652       {
2653       lcount = -1;
2654       errno = EINTR;
2655       }
2656     else
2657       lcount = poll(fd_polls, poll_fd_count, -1);
2658
2659     if (lcount < 0)
2660       {
2661       select_failed = TRUE;
2662       lcount = 1;
2663       }
2664
2665     /* Clean up any subprocesses that may have terminated. We need to do this
2666     here so that smtp_accept_max_per_host works when a connection to that host
2667     has completed, and we are about to accept a new one. When this code was
2668     later in the sequence, a new connection could be rejected, even though an
2669     old one had just finished. Preserve the errno from any select() failure for
2670     the use of the common select/accept error processing below. */
2671
2672       {
2673       int select_errno = errno;
2674       handle_ending_processes();
2675
2676 #ifndef DISABLE_TLS
2677       {
2678       int old_tfd;
2679       /* Create or rotate any required keys; handle (delayed) filewatch event */
2680
2681       if ((old_tfd = tls_daemon_tick()) >= 0)
2682         for (struct pollfd * p = &fd_polls[listen_socket_count];
2683              p < fd_polls + poll_fd_count; p++)
2684           if (p->fd == old_tfd) { p->fd = tls_watch_fd ; break; }
2685       }
2686 #endif
2687       errno = select_errno;
2688       }
2689
2690     /* Loop for all the sockets that are currently ready to go. If select
2691     actually failed, we have set the count to 1 and select_failed=TRUE, so as
2692     to use the common error code for select/accept below. */
2693
2694     while (lcount-- > 0)
2695       {
2696       int accept_socket = -1;
2697 #if HAVE_IPV6
2698       struct sockaddr_in6 accepted;
2699 #else
2700       struct sockaddr_in accepted;
2701 #endif
2702
2703       if (!select_failed)
2704         {
2705 #if !defined(DISABLE_TLS) && (defined(EXIM_HAVE_INOTIFY) || defined(EXIM_HAVE_KEVENT))
2706         if (tls_watch_poll && tls_watch_poll->revents & POLLIN)
2707           {
2708           tls_watch_poll->revents = 0;
2709           tls_watch_trigger_time = time(NULL);  /* Set up delayed event */
2710           tls_watch_discard_event(tls_watch_fd);
2711           break;        /* to top of daemon loop */
2712           }
2713 #endif
2714         /* Handle the daemon-notifier socket.  If it was a fast-ramp
2715         notification then queuerun_msgid will have a nonzerolength string. */
2716
2717         if (dnotify_poll && dnotify_poll->revents & POLLIN)
2718           {
2719           dnotify_poll->revents = 0;
2720           daemon_notification();
2721           break;        /* to top of daemon loop */
2722           }
2723         for (struct pollfd * p = fd_polls; p < fd_polls + listen_socket_count;
2724              p++)
2725           if (p->revents & POLLIN)
2726             {
2727             EXIM_SOCKLEN_T alen = sizeof(accepted);
2728 #if defined(__FreeBSD__) && defined(SO_LISTENQLEN)
2729             int backlog;
2730             socklen_t blen = sizeof(backlog);
2731
2732             if (  smtp_backlog_monitor > 0
2733                && getsockopt(p->fd, SOL_SOCKET, SO_LISTENQLEN, &backlog, &blen) == 0)
2734               {
2735               DEBUG(D_interface)
2736                 debug_printf("listen fd %d queue curr %d\n", p->fd, backlog);
2737               smtp_listen_backlog = backlog;
2738               }
2739
2740 #elif defined(TCP_INFO) && defined(EXIM_HAVE_TCPI_UNACKED)
2741             struct tcp_info ti;
2742             socklen_t tlen = sizeof(ti);
2743
2744             /* If monitoring the backlog is wanted, grab for later logging */
2745
2746             smtp_listen_backlog = 0;
2747             if (  smtp_backlog_monitor > 0
2748                && getsockopt(p->fd, IPPROTO_TCP, TCP_INFO, &ti, &tlen) == 0)
2749               {
2750               DEBUG(D_interface) debug_printf("listen fd %d queue max %u curr %u\n",
2751                       p->fd, ti.tcpi_sacked, ti.tcpi_unacked);
2752               smtp_listen_backlog = ti.tcpi_unacked;
2753               }
2754 #endif
2755             p->revents = 0;
2756             accept_socket = accept(p->fd, (struct sockaddr *)&accepted, &alen);
2757             break;
2758             }
2759         }
2760
2761       /* If select or accept has failed and this was not caused by an
2762       interruption, log the incident and try again. With asymmetric TCP/IP
2763       routing errors such as "No route to network" have been seen here. Also
2764       "connection reset by peer" has been seen. These cannot be classed as
2765       disastrous errors, but they could fill up a lot of log. The code in smail
2766       crashes the daemon after 10 successive failures of accept, on the grounds
2767       that some OS fail continuously. Exim originally followed suit, but this
2768       appears to have caused problems. Now it just keeps going, but instead of
2769       logging each error, it batches them up when they are continuous. */
2770
2771       if (accept_socket < 0 && errno != EINTR)
2772         {
2773         if (accept_retry_count == 0)
2774           {
2775           accept_retry_errno = errno;
2776           accept_retry_select_failed = select_failed;
2777           }
2778         else if (  errno != accept_retry_errno
2779                 || select_failed != accept_retry_select_failed
2780                 || accept_retry_count >= 50)
2781           {
2782           log_write(0, LOG_MAIN | (accept_retry_count >= 50 ? LOG_PANIC : 0),
2783             "%d %s() failure%s: %s",
2784             accept_retry_count,
2785             accept_retry_select_failed ? "select" : "accept",
2786             accept_retry_count == 1 ? "" : "s",
2787             strerror(accept_retry_errno));
2788           log_close_all();
2789           accept_retry_count = 0;
2790           accept_retry_errno = errno;
2791           accept_retry_select_failed = select_failed;
2792           }
2793         accept_retry_count++;
2794         }
2795       else if (accept_retry_count > 0)
2796         {
2797         log_write(0, LOG_MAIN, "%d %s() failure%s: %s",
2798           accept_retry_count,
2799           accept_retry_select_failed ? "select" : "accept",
2800           accept_retry_count == 1 ? "" : "s",
2801           strerror(accept_retry_errno));
2802         log_close_all();
2803         accept_retry_count = 0;
2804         }
2805
2806       /* If select/accept succeeded, deal with the connection. */
2807
2808       if (accept_socket >= 0)
2809         {
2810 #ifdef TCP_QUICKACK /* Avoid pure-ACKs while in tls protocol pingpong phase */
2811         /* Unfortunately we cannot be certain to do this before a TLS-on-connect
2812         Client Hello arrives and is acked. We do it as early as possible. */
2813         (void) setsockopt(accept_socket, IPPROTO_TCP, TCP_QUICKACK, US &off, sizeof(off));
2814 #endif
2815         if (inetd_wait_timeout)
2816           last_connection_time = time(NULL);
2817         handle_smtp_call(fd_polls, listen_socket_count, accept_socket,
2818           (struct sockaddr *)&accepted);
2819         }
2820       }
2821     }
2822
2823   /* If not listening, then just sleep for the queue interval. If we woke
2824   up early the last time for some other signal, it won't matter because
2825   the alarm signal will wake at the right time. This code originally used
2826   sleep() but it turns out that on the FreeBSD system, sleep() is not inter-
2827   rupted by signals, so it wasn't waking up for SIGALRM or SIGCHLD. Luckily
2828   select() can be used as an interruptible sleep() on all versions of Unix. */
2829
2830   else
2831     {
2832     struct pollfd p;
2833     poll(&p, 0, nolisten_sleep * 1000);
2834     handle_ending_processes();
2835     }
2836
2837   /* Re-enable the SIGCHLD handler if it has been run. It can't do it
2838   for itself, because it isn't doing the waiting itself. */
2839
2840   if (sigchld_seen)
2841     {
2842     sigchld_seen = FALSE;
2843     os_non_restarting_signal(SIGCHLD, main_sigchld_handler);
2844     }
2845
2846   /* Handle being woken by SIGHUP. We know at this point that the result
2847   of accept() has been dealt with, so we can re-exec exim safely, first
2848   closing the listening sockets so that they can be reused. Cancel any pending
2849   alarm in case it is just about to go off, and set SIGHUP to be ignored so
2850   that another HUP in quick succession doesn't clobber the new daemon before it
2851   gets going. All log files get closed by the close-on-exec flag; however, if
2852   the exec fails, we need to close the logs. */
2853
2854   if (sighup_seen)
2855     {
2856     log_write(0, LOG_MAIN, "pid %ld: SIGHUP received: re-exec daemon",
2857       getpid());
2858     close_daemon_sockets(daemon_notifier_fd, fd_polls, listen_socket_count);
2859     unlink_notifier_socket();
2860     ALARM_CLR(0);
2861     signal(SIGHUP, SIG_IGN);
2862     sighup_argv[0] = exim_path;
2863     exim_nullstd();
2864     execv(CS exim_path, (char *const *)sighup_argv);
2865     log_write(0, LOG_MAIN|LOG_PANIC_DIE, "pid %ld: exec of %s failed: %s",
2866       getpid(), exim_path, strerror(errno));
2867     log_close_all();
2868     }
2869
2870   }   /* End of main loop */
2871
2872 /* Control never reaches here */
2873 }
2874
2875 /* vi: aw ai sw=2
2876 */
2877 /* End of exim_daemon.c */