server/mpm/experimental/event/event.c - httpd - Git at Google

 /* Copyright 2001-2005 The Apache Software Foundation or its licensors, as
  * applicable.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 /**
  * This MPM tries to fix the 'keep alive problem' in HTTP.
  *
  * After a client completes the first request, the client can keep the
  * connection open to send more requests with the same socket.  This can save
  * signifigant overhead in creating TCP connections.  However, the major
  * disadvantage is that Apache traditionally keeps an entire child
  * process/thread waiting for data from the client.  To solve this problem,
  * this MPM has a dedicated thread for handling both the Listenting sockets,
  * and all sockets that are in a Keep Alive status.
  *
  * The MPM assumes the underlying apr_pollset implmentation is somewhat
  * threadsafe.  This currently is only compatible with KQueue and EPoll.  This
  * enables the MPM to avoid extra high level locking or having to wake up the
  * listener thread when a keep-alive socket needs to be sent to it.
  *
  * This MPM not preform well on older platforms that do not have very good
  * threading, like Linux with a 2.4 kernel, but this does not matter, since we
  * require EPoll or KQueue.
  *
  * For FreeBSD, use 5.3.  It is possible to run this MPM on FreeBSD 5.2.1, if
  * you use libkse (see `man libmap.conf`).
  *
  * For NetBSD, use at least 2.0.
  *
  * For Linux, you should use a 2.6 kernel, and make sure your glibc has epoll
  * support compiled in.
  *
  */

 #include "apr.h"
 #include "apr_portable.h"
 #include "apr_strings.h"
 #include "apr_file_io.h"
 #include "apr_thread_proc.h"
 #include "apr_signal.h"
 #include "apr_thread_mutex.h"
 #include "apr_proc_mutex.h"
 #include "apr_poll.h"
 #include "apr_ring.h"
 #include "apr_queue.h"
 #define APR_WANT_STRFUNC
 #include "apr_want.h"

 #if APR_HAVE_UNISTD_H
 #include <unistd.h>
 #endif
 #if APR_HAVE_SYS_SOCKET_H
 #include <sys/socket.h>
 #endif
 #if APR_HAVE_SYS_WAIT_H
 #include <sys/wait.h>
 #endif
 #ifdef HAVE_SYS_PROCESSOR_H
 #include <sys/processor.h>      /* for bindprocessor() */
 #endif

 #if !APR_HAS_THREADS
 #error The Event MPM requires APR threads, but they are unavailable.
 #endif

 #define CORE_PRIVATE

 #include "ap_config.h"
 #include "httpd.h"
 #include "http_main.h"
 #include "http_log.h"
 #include "http_config.h"        /* for read_config */
 #include "http_core.h"          /* for get_remote_host */
 #include "http_connection.h"
 #include "ap_mpm.h"
 #include "pod.h"
 #include "mpm_common.h"
 #include "ap_listen.h"
 #include "scoreboard.h"
 #include "fdqueue.h"
 #include "mpm_default.h"
 #include "http_vhost.h"

 #include <signal.h>
 #include <limits.h>             /* for INT_MAX */

 /* Limit on the total --- clients will be locked out if more servers than
  * this are needed.  It is intended solely to keep the server from crashing
  * when things get out of hand.
  *
  * We keep a hard maximum number of servers, for two reasons --- first off,
  * in case something goes seriously wrong, we want to stop the fork bomb
  * short of actually crashing the machine we're running on by filling some
  * kernel table.  Secondly, it keeps the size of the scoreboard file small
  * enough that we can read the whole thing without worrying too much about
  * the overhead.
  */
 #ifndef DEFAULT_SERVER_LIMIT
 #define DEFAULT_SERVER_LIMIT 16
 #endif

 /* Admin can't tune ServerLimit beyond MAX_SERVER_LIMIT.  We want
  * some sort of compile-time limit to help catch typos.
  */
 #ifndef MAX_SERVER_LIMIT
 #define MAX_SERVER_LIMIT 20000
 #endif

 /* Limit on the threads per process.  Clients will be locked out if more than
  * this are needed.
  *
  * We keep this for one reason it keeps the size of the scoreboard file small
  * enough that we can read the whole thing without worrying too much about
  * the overhead.
  */
 #ifndef DEFAULT_THREAD_LIMIT
 #define DEFAULT_THREAD_LIMIT 64
 #endif

 /* Admin can't tune ThreadLimit beyond MAX_THREAD_LIMIT.  We want
  * some sort of compile-time limit to help catch typos.
  */
 #ifndef MAX_THREAD_LIMIT
 #define MAX_THREAD_LIMIT 100000
 #endif

 /*
  * Actual definitions of config globals
  */

 int ap_threads_per_child = 0;   /* Worker threads per child */
 static int ap_daemons_to_start = 0;
 static int min_spare_threads = 0;
 static int max_spare_threads = 0;
 static int ap_daemons_limit = 0;
 static int server_limit = DEFAULT_SERVER_LIMIT;
 static int first_server_limit = 0;
 static int thread_limit = DEFAULT_THREAD_LIMIT;
 static int first_thread_limit = 0;
 static int changed_limit_at_restart;
 static int dying = 0;
 static int workers_may_exit = 0;
 static int start_thread_may_exit = 0;
 static int listener_may_exit = 0;
 static int requests_this_child;
 static int num_listensocks = 0;
 static int resource_shortage = 0;
 static fd_queue_t *worker_queue;
 static fd_queue_info_t *worker_queue_info;
 static int mpm_state = AP_MPMQ_STARTING;
 static int sick_child_detected;

 apr_thread_mutex_t *timeout_mutex;
 APR_RING_HEAD(timeout_head_t, conn_state_t);
 static struct timeout_head_t timeout_head, keepalive_timeout_head;

 static apr_pollset_t *event_pollset;

 /* The structure used to pass unique initialization info to each thread */
 typedef struct
 {
     int pid;
     int tid;
     int sd;
 } proc_info;

 /* Structure used to pass information to the thread responsible for
  * creating the rest of the threads.
  */
 typedef struct
 {
     apr_thread_t **threads;
     apr_thread_t *listener;
     int child_num_arg;
     apr_threadattr_t *threadattr;
 } thread_starter;

 typedef enum
 {
     PT_CSD,
     PT_ACCEPT
 } poll_type_e;

 typedef struct
 {
     poll_type_e type;
     int status;        /*XXX what is this for?  0 and 1 don't make it clear */
     void *baton;
 } listener_poll_type;

 #define ID_FROM_CHILD_THREAD(c, t)    ((c * thread_limit) + t)

 /*
  * The max child slot ever assigned, preserved across restarts.  Necessary
  * to deal with MaxClients changes across AP_SIG_GRACEFUL restarts.  We
  * use this value to optimize routines that have to scan the entire
  * scoreboard.
  */
 int ap_max_daemons_limit = -1;

 static ap_pod_t *pod;

 /* *Non*-shared http_main globals... */

 server_rec *ap_server_conf;

 /* The worker MPM respects a couple of runtime flags that can aid
  * in debugging. Setting the -DNO_DETACH flag will prevent the root process
  * from detaching from its controlling terminal. Additionally, setting
  * the -DONE_PROCESS flag (which implies -DNO_DETACH) will get you the
  * child_main loop running in the process which originally started up.
  * This gives you a pretty nice debugging environment.  (You'll get a SIGHUP
  * early in standalone_main; just continue through.  This is the server
  * trying to kill off any child processes which it might have lying
  * around --- Apache doesn't keep track of their pids, it just sends
  * SIGHUP to the process group, ignoring it in the root process.
  * Continue through and you'll be fine.).
  */

 static int one_process = 0;

 #ifdef DEBUG_SIGSTOP
 int raise_sigstop_flags;
 #endif

 static apr_pool_t *pconf;       /* Pool for config stuff */
 static apr_pool_t *pchild;      /* Pool for httpd child stuff */

 static pid_t ap_my_pid;         /* Linux getpid() doesn't work except in main
                                    thread. Use this instead */
 static pid_t parent_pid;
 static apr_os_thread_t *listener_os_thread;

 /* The LISTENER_SIGNAL signal will be sent from the main thread to the
  * listener thread to wake it up for graceful termination (what a child
  * process from an old generation does when the admin does "apachectl
  * graceful").  This signal will be blocked in all threads of a child
  * process except for the listener thread.
  */
 #define LISTENER_SIGNAL     SIGHUP

 /* An array of socket descriptors in use by each thread used to
  * perform a non-graceful (forced) shutdown of the server.
  */
 static apr_socket_t **worker_sockets;

 static void close_worker_sockets(void)
 {
     int i;
     for (i = 0; i < ap_threads_per_child; i++) {
         if (worker_sockets[i]) {
             apr_socket_close(worker_sockets[i]);
             worker_sockets[i] = NULL;
         }
     }
 }

 static void wakeup_listener(void)
 {
     listener_may_exit = 1;
     if (!listener_os_thread) {
         /* XXX there is an obscure path that this doesn't handle perfectly:
          *     right after listener thread is created but before
          *     listener_os_thread is set, the first worker thread hits an
          *     error and starts graceful termination
          */
         return;
     }
     /*
      * we should just be able to "kill(ap_my_pid, LISTENER_SIGNAL)" on all
      * platforms and wake up the listener thread since it is the only thread
      * with SIGHUP unblocked, but that doesn't work on Linux
      */
 #ifdef HAVE_PTHREAD_KILL
     pthread_kill(*listener_os_thread, LISTENER_SIGNAL);
 #else
     kill(ap_my_pid, LISTENER_SIGNAL);
 #endif
 }

 #define ST_INIT              0
 #define ST_GRACEFUL          1
 #define ST_UNGRACEFUL        2

 static int terminate_mode = ST_INIT;

 static void signal_threads(int mode)
 {
     if (terminate_mode == mode) {
         return;
     }
     terminate_mode = mode;
     mpm_state = AP_MPMQ_STOPPING;

     /* in case we weren't called from the listener thread, wake up the
      * listener thread
      */
     wakeup_listener();

     /* for ungraceful termination, let the workers exit now;
      * for graceful termination, the listener thread will notify the
      * workers to exit once it has stopped accepting new connections
      */
     if (mode == ST_UNGRACEFUL) {
         workers_may_exit = 1;
         ap_queue_interrupt_all(worker_queue);
         ap_queue_info_term(worker_queue_info);
         close_worker_sockets(); /* forcefully kill all current connections */
     }
 }

 AP_DECLARE(apr_status_t) ap_mpm_query(int query_code, int *result)
 {
     switch (query_code) {
     case AP_MPMQ_MAX_DAEMON_USED:
         *result = ap_max_daemons_limit;
         return APR_SUCCESS;
     case AP_MPMQ_IS_THREADED:
         *result = AP_MPMQ_STATIC;
         return APR_SUCCESS;
     case AP_MPMQ_IS_FORKED:
         *result = AP_MPMQ_DYNAMIC;
         return APR_SUCCESS;
     case AP_MPMQ_IS_ASYNC:
         *result = 1;
         return APR_SUCCESS;
     case AP_MPMQ_HARD_LIMIT_DAEMONS:
         *result = server_limit;
         return APR_SUCCESS;
     case AP_MPMQ_HARD_LIMIT_THREADS:
         *result = thread_limit;
         return APR_SUCCESS;
     case AP_MPMQ_MAX_THREADS:
         *result = ap_threads_per_child;
         return APR_SUCCESS;
     case AP_MPMQ_MIN_SPARE_DAEMONS:
         *result = 0;
         return APR_SUCCESS;
     case AP_MPMQ_MIN_SPARE_THREADS:
         *result = min_spare_threads;
         return APR_SUCCESS;
     case AP_MPMQ_MAX_SPARE_DAEMONS:
         *result = 0;
         return APR_SUCCESS;
     case AP_MPMQ_MAX_SPARE_THREADS:
         *result = max_spare_threads;
         return APR_SUCCESS;
     case AP_MPMQ_MAX_REQUESTS_DAEMON:
         *result = ap_max_requests_per_child;
         return APR_SUCCESS;
     case AP_MPMQ_MAX_DAEMONS:
         *result = ap_daemons_limit;
         return APR_SUCCESS;
     case AP_MPMQ_MPM_STATE:
         *result = mpm_state;
         return APR_SUCCESS;
     }
     return APR_ENOTIMPL;
 }

 /* a clean exit from a child with proper cleanup */
 static void clean_child_exit(int code) __attribute__ ((noreturn));
 static void clean_child_exit(int code)
 {
     mpm_state = AP_MPMQ_STOPPING;
     if (pchild) {
         apr_pool_destroy(pchild);
     }
     exit(code);
 }

 static void just_die(int sig)
 {
     clean_child_exit(0);
 }

 /*****************************************************************
  * Connection structures and accounting...
  */

 /* volatile just in case */
 static int volatile shutdown_pending;
 static int volatile restart_pending;
 static int volatile is_graceful;
 static volatile int child_fatal;
 ap_generation_t volatile ap_my_generation;

 /*
  * ap_start_shutdown() and ap_start_restart(), below, are a first stab at
  * functions to initiate shutdown or restart without relying on signals.
  * Previously this was initiated in sig_term() and restart() signal handlers,
  * but we want to be able to start a shutdown/restart from other sources --
  * e.g. on Win32, from the service manager. Now the service manager can
  * call ap_start_shutdown() or ap_start_restart() as appropiate.  Note that
  * these functions can also be called by the child processes, since global
  * variables are no longer used to pass on the required action to the parent.
  *
  * These should only be called from the parent process itself, since the
  * parent process will use the shutdown_pending and restart_pending variables
  * to determine whether to shutdown or restart. The child process should
  * call signal_parent() directly to tell the parent to die -- this will
  * cause neither of those variable to be set, which the parent will
  * assume means something serious is wrong (which it will be, for the
  * child to force an exit) and so do an exit anyway.
  */

 static void ap_start_shutdown(int graceful)
 {
     mpm_state = AP_MPMQ_STOPPING;
     if (shutdown_pending == 1) {
         /* Um, is this _probably_ not an error, if the user has
          * tried to do a shutdown twice quickly, so we won't
          * worry about reporting it.
          */
         return;
     }
     shutdown_pending = 1;
     is_graceful = graceful;
 }

 /* do a graceful restart if graceful == 1 */
 static void ap_start_restart(int graceful)
 {
     mpm_state = AP_MPMQ_STOPPING;
     if (restart_pending == 1) {
         /* Probably not an error - don't bother reporting it */
         return;
     }
     restart_pending = 1;
     is_graceful = graceful;
 }

 static void sig_term(int sig)
 {
     ap_start_shutdown(sig == AP_SIG_GRACEFUL_STOP);
 }

 static void restart(int sig)
 {
     ap_start_restart(sig == AP_SIG_GRACEFUL);
 }

 static void set_signals(void)
 {
 #ifndef NO_USE_SIGACTION
     struct sigaction sa;
 #endif

     if (!one_process) {
         ap_fatal_signal_setup(ap_server_conf, pconf);
     }

 #ifndef NO_USE_SIGACTION
     sigemptyset(&sa.sa_mask);
     sa.sa_flags = 0;

     sa.sa_handler = sig_term;
     if (sigaction(SIGTERM, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGTERM)");
 #ifdef AP_SIG_GRACEFUL_STOP
     if (sigaction(AP_SIG_GRACEFUL_STOP, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(" AP_SIG_GRACEFUL_STOP_STRING ")");
 #endif
 #ifdef SIGINT
     if (sigaction(SIGINT, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGINT)");
 #endif
 #ifdef SIGXCPU
     sa.sa_handler = SIG_DFL;
     if (sigaction(SIGXCPU, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGXCPU)");
 #endif
 #ifdef SIGXFSZ
     sa.sa_handler = SIG_DFL;
     if (sigaction(SIGXFSZ, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGXFSZ)");
 #endif
 #ifdef SIGPIPE
     sa.sa_handler = SIG_IGN;
     if (sigaction(SIGPIPE, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGPIPE)");
 #endif

     /* we want to ignore HUPs and AP_SIG_GRACEFUL while we're busy
      * processing one */
     sigaddset(&sa.sa_mask, SIGHUP);
     sigaddset(&sa.sa_mask, AP_SIG_GRACEFUL);
     sa.sa_handler = restart;
     if (sigaction(SIGHUP, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(SIGHUP)");
     if (sigaction(AP_SIG_GRACEFUL, &sa, NULL) < 0)
         ap_log_error(APLOG_MARK, APLOG_WARNING, errno, ap_server_conf,
                      "sigaction(" AP_SIG_GRACEFUL_STRING ")");
 #else
     if (!one_process) {
 #ifdef SIGXCPU
         apr_signal(SIGXCPU, SIG_DFL);
 #endif /* SIGXCPU */
 #ifdef SIGXFSZ
         apr_signal(SIGXFSZ, SIG_DFL);
 #endif /* SIGXFSZ */
     }

     apr_signal(SIGTERM, sig_term);
 #ifdef SIGHUP
     apr_signal(SIGHUP, restart);
 #endif /* SIGHUP */
 #ifdef AP_SIG_GRACEFUL
     apr_signal(AP_SIG_GRACEFUL, restart);
 #endif /* AP_SIG_GRACEFUL */
 #ifdef AP_SIG_GRACEFUL_STOP
      apr_signal(AP_SIG_GRACEFUL_STOP, sig_term);
 #endif /* AP_SIG_GRACEFUL_STOP */
 #ifdef SIGPIPE
     apr_signal(SIGPIPE, SIG_IGN);
 #endif /* SIGPIPE */

 #endif
 }

 /*****************************************************************
  * Here follows a long bunch of generic server bookkeeping stuff...
  */

 int ap_graceful_stop_signalled(void)
     /* XXX this is really a bad confusing obsolete name
      * maybe it should be ap_mpm_process_exiting?
      */
 {
     /* note: for a graceful termination, listener_may_exit will be set before
      *       workers_may_exit, so check listener_may_exit
      */
     return listener_may_exit;
 }

 /*****************************************************************
  * Child process main loop.
  */

 static int process_socket(apr_pool_t * p, apr_socket_t * sock,
                           conn_state_t * cs, int my_child_num,
                           int my_thread_num)
 {
     conn_rec *c;
     listener_poll_type *pt;
     long conn_id = ID_FROM_CHILD_THREAD(my_child_num, my_thread_num);
     int csd;
     int rc;
     apr_time_t time_now = 0;
     ap_sb_handle_t *sbh;

     ap_create_sb_handle(&sbh, p, my_child_num, my_thread_num);
     apr_os_sock_get(&csd, sock);

     time_now = apr_time_now();

     if (cs == NULL) {           /* This is a new connection */

         cs = apr_pcalloc(p, sizeof(conn_state_t));

         pt = apr_pcalloc(p, sizeof(*pt));

         cs->bucket_alloc = apr_bucket_alloc_create(p);
         c = ap_run_create_connection(p, ap_server_conf, sock,
                                      conn_id, sbh, cs->bucket_alloc);
         cs->c = c;
         c->cs = cs;
         cs->p = p;
         cs->pfd.desc_type = APR_POLL_SOCKET;
         cs->pfd.reqevents = APR_POLLIN;
         cs->pfd.desc.s = sock;
         pt->type = PT_CSD;
         pt->status = 1;
         pt->baton = cs;
         cs->pfd.client_data = pt;
         APR_RING_ELEM_INIT(cs, timeout_list);

         ap_update_vhost_given_ip(c);

         rc = ap_run_pre_connection(c, sock);
         if (rc != OK && rc != DONE) {
             ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ap_server_conf,
                          "process_socket: connection aborted");
             c->aborted = 1;
         }

         /**
          * XXX If the platform does not have a usable way of bundling
          * accept() with a socket readability check, like Win32,
          * and there are measurable delays before the
          * socket is readable due to the first data packet arriving,
          * it might be better to create the cs on the listener thread
          * with the state set to CONN_STATE_CHECK_REQUEST_LINE_READABLE
          *
          * FreeBSD users will want to enable the HTTP accept filter
          * module in their kernel for the highest performance
          * When the accept filter is active, sockets are kept in the
          * kernel until a HTTP request is received.
          */
         cs->state = CONN_STATE_READ_REQUEST_LINE;

     }
     else {
         c = cs->c;
         c->sbh = sbh;
         pt = cs->pfd.client_data;
     }

 read_request:
     if (cs->state == CONN_STATE_READ_REQUEST_LINE) {
         if (!c->aborted) {
             ap_run_process_connection(c);

             /* state will be updated upon return
              * fall thru to either wait for readability/timeout or
              * do lingering close
              */
         }
         else {
             cs->state = CONN_STATE_LINGER;
         }
     }

     if (cs->state == CONN_STATE_WRITE_COMPLETION) {
         /* For now, do blocking writes in this thread to transfer the
          * rest of the response.  TODO: Hand off this connection to a
          * pollset for asynchronous write completion.
          */
         ap_filter_t *output_filter = c->output_filters;
         apr_status_t rv;
         while (output_filter->next != NULL) {
             output_filter = output_filter->next;
         }
         rv = output_filter->frec->filter_func.out_func(output_filter, NULL);
         if (rv != APR_SUCCESS) {
             ap_log_error(APLOG_MARK, APLOG_WARNING, rv, ap_server_conf,
                      "network write failure in core output filter");
             cs->state = CONN_STATE_LINGER;
         }
         else if (c->data_in_output_filters) {
             /* Still in WRITE_COMPLETION_STATE:
              * Set a write timeout for this connection, and let the
              * event thread poll for writeability.
              */
             cs->expiration_time = ap_server_conf->timeout + time_now;
             apr_thread_mutex_lock(timeout_mutex);
             APR_RING_INSERT_TAIL(&timeout_head, cs, conn_state_t, timeout_list);
             apr_thread_mutex_unlock(timeout_mutex);
             pt->status = 0;
             cs->pfd.reqevents = APR_POLLOUT | APR_POLLHUP | APR_POLLERR;
             rc = apr_pollset_add(event_pollset, &cs->pfd);
             return 1;
         }
         else if (c->keepalive != AP_CONN_KEEPALIVE || c->aborted ||
             ap_graceful_stop_signalled()) {
             c->cs->state = CONN_STATE_LINGER;
         }
         else if (c->data_in_input_filters) {
             cs->state = CONN_STATE_READ_REQUEST_LINE;
             goto read_request;
         }
         else {
             cs->state = CONN_STATE_CHECK_REQUEST_LINE_READABLE;
         }
     }

     if (cs->state == CONN_STATE_LINGER) {
         ap_lingering_close(c);
         apr_bucket_alloc_destroy(cs->bucket_alloc);
         apr_pool_clear(p);
         ap_push_pool(worker_queue_info, p);
         return 1;
     }
     else if (cs->state == CONN_STATE_CHECK_REQUEST_LINE_READABLE) {
         apr_status_t rc;
         listener_poll_type *pt = (listener_poll_type *) cs->pfd.client_data;

         /* It greatly simplifies the logic to use a single timeout value here
          * because the new element can just be added to the end of the list and
          * it will stay sorted in expiration time sequence.  If brand new
          * sockets are sent to the event thread for a readability check, this
          * will be a slight behavior change - they use the non-keepalive
          * timeout today.  With a normal client, the socket will be readable in
          * a few milliseconds anyway.
          */
         cs->expiration_time = ap_server_conf->keep_alive_timeout + time_now;
         apr_thread_mutex_lock(timeout_mutex);
         APR_RING_INSERT_TAIL(&keepalive_timeout_head, cs, conn_state_t, timeout_list);
         apr_thread_mutex_unlock(timeout_mutex);

         pt->status = 0;
         /* Add work to pollset. */
         cs->pfd.reqevents = APR_POLLIN;
         rc = apr_pollset_add(event_pollset, &cs->pfd);

         if (rc != APR_SUCCESS) {
             ap_log_error(APLOG_MARK, APLOG_ERR, rc, ap_server_conf,
                          "process_socket: apr_pollset_add failure");
             AP_DEBUG_ASSERT(rc == APR_SUCCESS);
         }
     }
     return 0;
 }

 /* requests_this_child has gone to zero or below.  See if the admin coded
    "MaxRequestsPerChild 0", and keep going in that case.  Doing it this way
    simplifies the hot path in worker_thread */
 static void check_infinite_requests(void)
 {
     if (ap_max_requests_per_child) {
         signal_threads(ST_GRACEFUL);
     }
     else {
         /* wow! if you're executing this code, you may have set a record.
          * either this child process has served over 2 billion requests, or
          * you're running a threaded 2.0 on a 16 bit machine.
          *
          * I'll buy pizza and beers at Apachecon for the first person to do
          * the former without cheating (dorking with INT_MAX, or running with
          * uncommitted performance patches, for example).
          *
          * for the latter case, you probably deserve a beer too.   Greg Ames
          */

         requests_this_child = INT_MAX;  /* keep going */
     }
 }

 static void unblock_signal(int sig)
 {
     sigset_t sig_mask;

     sigemptyset(&sig_mask);
     sigaddset(&sig_mask, sig);
 #if defined(SIGPROCMASK_SETS_THREAD_MASK)
     sigprocmask(SIG_UNBLOCK, &sig_mask, NULL);
 #else
     pthread_sigmask(SIG_UNBLOCK, &sig_mask, NULL);
 #endif
 }

 static void dummy_signal_handler(int sig)
 {
     /* XXX If specifying SIG_IGN is guaranteed to unblock a syscall,
      *     then we don't need this goofy function.
      */
 }

 static apr_status_t push2worker(const apr_pollfd_t * pfd,
                                 apr_pollset_t * pollset)
 {
     listener_poll_type *pt = (listener_poll_type *) pfd->client_data;
     conn_state_t *cs = (conn_state_t *) pt->baton;
     apr_status_t rc;

     if (pt->status == 1) {
         return 0;
     }

     pt->status = 1;

     rc = apr_pollset_remove(pollset, pfd);

     /*
      * Some of the pollset backends, like KQueue or Epoll
      * automagically remove the FD if the socket is closed,
      * therefore, we can accept _SUCCESS or _NOTFOUND,
      * and we still want to keep going
      */
     if (rc != APR_SUCCESS && rc != APR_NOTFOUND) {
         cs->state = CONN_STATE_LINGER;
     }

     rc = ap_queue_push(worker_queue, cs->pfd.desc.s, cs, cs->p);
     if (rc != APR_SUCCESS) {
         /* trash the connection; we couldn't queue the connected
          * socket to a worker
          */
         apr_bucket_alloc_destroy(cs->bucket_alloc);
         apr_socket_close(cs->pfd.desc.s);
         ap_log_error(APLOG_MARK, APLOG_CRIT, rc,
                      ap_server_conf, "push2worker: ap_queue_push failed");
         apr_pool_clear(cs->p);
         ap_push_pool(worker_queue_info, cs->p);
     }

     return APR_SUCCESS;
 }

 /* get_worker:
  *     reserve a worker thread, block if all are currently busy.
  *     this prevents the worker queue from overflowing and lets
  *     other processes accept new connections in the mean time.
  */
 static int get_worker(int *have_idle_worker_p)
 {
     apr_status_t rc;

     if (!*have_idle_worker_p) {
         rc = ap_queue_info_wait_for_idler(worker_queue_info);

         if (rc == APR_SUCCESS) {
             *have_idle_worker_p = 1;
             return 1;
         }
         else {
             if (!APR_STATUS_IS_EOF(rc)) {
                 ap_log_error(APLOG_MARK, APLOG_ERR, rc, ap_server_conf,
                              "ap_queue_info_wait_for_idler failed.  "
                              "Attempting to shutdown process gracefully");
                 signal_threads(ST_GRACEFUL);
             }
             return 0;
         }
     }
     else {
         /* already reserved a worker thread - must have hit a
          * transient error on a previous pass
          */
         return 1;
     }
 }

 static void *listener_thread(apr_thread_t * thd, void *dummy)
 {
     apr_status_t rc;
     proc_info *ti = dummy;
     int process_slot = ti->pid;
     apr_pool_t *tpool = apr_thread_pool_get(thd);
     void *csd = NULL;
     apr_pool_t *ptrans;         /* Pool for per-transaction stuff */
     ap_listen_rec *lr;
     int have_idle_worker = 0;
     conn_state_t *cs;
     const apr_pollfd_t *out_pfd;
     apr_int32_t num = 0;
     apr_time_t time_now = 0;
     apr_interval_time_t timeout_interval;
     apr_time_t timeout_time;
     listener_poll_type *pt;

     free(ti);

     /* We set this to force apr_pollset to wakeup if there hasn't been any IO
      * on any of its sockets.  This allows sockets to have been added
      * when no other keepalive operations where going on.
      *
      * current value is 1 second
      */
     timeout_interval = 1000000;

     /* the following times out events that are really close in the future
      *   to prevent extra poll calls
      *
      * current value is .1 second
      */
 #define TIMEOUT_FUDGE_FACTOR 100000

     rc = apr_thread_mutex_create(&timeout_mutex, APR_THREAD_MUTEX_DEFAULT,
                                  tpool);
     if (rc != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ERR, rc, ap_server_conf,
                      "creation of the timeout mutex failed.  Attempting to "
                      "shutdown process gracefully");
         signal_threads(ST_GRACEFUL);
         return NULL;
     }

     APR_RING_INIT(&timeout_head, conn_state_t, timeout_list);
     APR_RING_INIT(&keepalive_timeout_head, conn_state_t, timeout_list);

     /* Create the main pollset */
     rc = apr_pollset_create(&event_pollset,
                             ap_threads_per_child,
                             tpool, APR_POLLSET_THREADSAFE | APR_POLLSET_NOCOPY);
     if (rc != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ERR, rc, ap_server_conf,
                      "apr_pollset_create with Thread Safety failed. "
                      "Attempting to shutdown process gracefully");
         signal_threads(ST_GRACEFUL);
         return NULL;
     }

     for (lr = ap_listeners; lr != NULL; lr = lr->next) {
         apr_pollfd_t *pfd = apr_palloc(tpool, sizeof(*pfd));
         pt = apr_pcalloc(tpool, sizeof(*pt));
         pfd->desc_type = APR_POLL_SOCKET;
         pfd->desc.s = lr->sd;
         pfd->reqevents = APR_POLLIN;

         pt->type = PT_ACCEPT;
         pt->baton = lr;

         pfd->client_data = pt;

         apr_socket_opt_set(pfd->desc.s, APR_SO_NONBLOCK, 1);
         apr_pollset_add(event_pollset, pfd);
     }

     /* Unblock the signal used to wake this thread up, and set a handler for
      * it.
      */
     unblock_signal(LISTENER_SIGNAL);
     apr_signal(LISTENER_SIGNAL, dummy_signal_handler);

     while (!listener_may_exit) {

         if (requests_this_child <= 0) {
             check_infinite_requests();
         }

         rc = apr_pollset_poll(event_pollset, timeout_interval, &num,
                               &out_pfd);

         if (rc != APR_SUCCESS) {
             if (APR_STATUS_IS_EINTR(rc)) {
                 continue;
             }
             if (!APR_STATUS_IS_TIMEUP(rc)) {
                 ap_log_error(APLOG_MARK, APLOG_ERR, rc, ap_server_conf,
                              "apr_pollset_poll failed.  Attempting to "
                              "shutdown process gracefully");
                 signal_threads(ST_GRACEFUL);
             }
         }

         if (listener_may_exit)
             break;

         while (num && get_worker(&have_idle_worker)) {
             pt = (listener_poll_type *) out_pfd->client_data;
             if (pt->type == PT_CSD) {
                 /* one of the sockets is readable */
                 cs = (conn_state_t *) pt->baton;
                 switch (cs->state) {
                 case CONN_STATE_CHECK_REQUEST_LINE_READABLE:
                     cs->state = CONN_STATE_READ_REQUEST_LINE;
                     break;
                 case CONN_STATE_WRITE_COMPLETION:
                     break;
                 default:
                     ap_log_error(APLOG_MARK, APLOG_ERR, rc,
                                  ap_server_conf,
                                  "event_loop: unexpected state %d",
                                  cs->state);
                     AP_DEBUG_ASSERT(0);
                 }

                 apr_thread_mutex_lock(timeout_mutex);
                 APR_RING_REMOVE(cs, timeout_list);
                 apr_thread_mutex_unlock(timeout_mutex);
                 APR_RING_ELEM_INIT(cs, timeout_list);

                 rc = push2worker(out_pfd, event_pollset);
                 if (rc != APR_SUCCESS) {
                     ap_log_error(APLOG_MARK, APLOG_CRIT, rc,
                                  ap_server_conf, "push2worker failed");
                 }
                 else {
                     have_idle_worker = 0;
                 }
             }
             else {
                 /* A Listener Socket is ready for an accept() */

                 lr = (ap_listen_rec *) pt->baton;

                 ap_pop_pool(&ptrans, worker_queue_info);

                 if (ptrans == NULL) {
                     /* create a new transaction pool for each accepted socket */
                     apr_allocator_t *allocator;

                     apr_allocator_create(&allocator);
                     apr_allocator_max_free_set(allocator,
                                                ap_max_mem_free);
                     apr_pool_create_ex(&ptrans, pconf, NULL, allocator);
                     apr_allocator_owner_set(allocator, ptrans);
                     if (ptrans == NULL) {
                         ap_log_error(APLOG_MARK, APLOG_CRIT, rc,
                                      ap_server_conf,
                                      "Failed to create transaction pool");
                         signal_threads(ST_GRACEFUL);
                         return NULL;
                     }
                 }

                 apr_pool_tag(ptrans, "transaction");

                 rc = lr->accept_func(&csd, lr, ptrans);

                 /* later we trash rv and rely on csd to indicate
                  * success/failure
                  */
                 AP_DEBUG_ASSERT(rc == APR_SUCCESS || !csd);

                 if (rc == APR_EGENERAL) {
                     /* E[NM]FILE, ENOMEM, etc */
                     resource_shortage = 1;
                     signal_threads(ST_GRACEFUL);
                 }

                 if (csd != NULL) {
                     rc = ap_queue_push(worker_queue, csd, NULL, ptrans);
                     if (rc != APR_SUCCESS) {
                         /* trash the connection; we couldn't queue the connected
                          * socket to a worker
                          */
                         apr_socket_close(csd);
                         ap_log_error(APLOG_MARK, APLOG_CRIT, rc,
                                      ap_server_conf,
                                      "ap_queue_push failed");
                         apr_pool_clear(ptrans);
                         ap_push_pool(worker_queue_info, ptrans);
                     }
                     else {
                         have_idle_worker = 0;
                     }
                 }
                 else {
                     apr_pool_clear(ptrans);
                     ap_push_pool(worker_queue_info, ptrans);
                 }
             }               /* if:else on pt->type */
             out_pfd++;
             num--;
         }                   /* while for processing poll */

         /* XXX possible optimization: stash the current time for use as
          * r->request_time for new requests
          */
         time_now = apr_time_now();

         /* handle timed out sockets */
         apr_thread_mutex_lock(timeout_mutex);

         /* Step 1: keepalive timeouts */
         cs = APR_RING_FIRST(&keepalive_timeout_head);
         timeout_time = time_now + TIMEOUT_FUDGE_FACTOR;
         while (!APR_RING_EMPTY(&keepalive_timeout_head, conn_state_t, timeout_list)
                && cs->expiration_time < timeout_time
                && get_worker(&have_idle_worker)) {

             cs->state = CONN_STATE_LINGER;

             APR_RING_REMOVE(cs, timeout_list);

             rc = push2worker(&cs->pfd, event_pollset);

             if (rc != APR_SUCCESS) {
                 return NULL;
                 /* XXX return NULL looks wrong - not an init failure
                  * that bypasses all the cleanup outside the main loop
                  * break seems more like it
                  * need to evaluate seriousness of push2worker failures
                  */
             }
             have_idle_worker = 0;
             cs = APR_RING_FIRST(&keepalive_timeout_head);
         }

         /* Step 2: write completion timeouts */
         cs = APR_RING_FIRST(&timeout_head);
         while (!APR_RING_EMPTY(&timeout_head, conn_state_t, timeout_list)
                && cs->expiration_time < timeout_time
                && get_worker(&have_idle_worker)) {

             cs->state = CONN_STATE_LINGER;
             APR_RING_REMOVE(cs, timeout_list);
             rc = push2worker(&cs->pfd, event_pollset);
             if (rc != APR_SUCCESS) {
                 return NULL;
             }
             have_idle_worker = 0;
             cs = APR_RING_FIRST(&timeout_head);
         }

         apr_thread_mutex_unlock(timeout_mutex);

     }     /* listener main loop */

     ap_close_listeners();
     ap_queue_term(worker_queue);
     dying = 1;
     ap_scoreboard_image->parent[process_slot].quiescing = 1;

     /* wake up the main thread */
     kill(ap_my_pid, SIGTERM);

     apr_thread_exit(thd, APR_SUCCESS);
     return NULL;
 }

 /* XXX For ungraceful termination/restart, we definitely don't want to
  *     wait for active connections to finish but we may want to wait
  *     for idle workers to get out of the queue code and release mutexes,
  *     since those mutexes are cleaned up pretty soon and some systems
  *     may not react favorably (i.e., segfault) if operations are attempted
  *     on cleaned-up mutexes.
  */
 static void *APR_THREAD_FUNC worker_thread(apr_thread_t * thd, void *dummy)
 {
     proc_info *ti = dummy;
     int process_slot = ti->pid;
     int thread_slot = ti->tid;
     apr_socket_t *csd = NULL;
     conn_state_t *cs;
     apr_pool_t *ptrans;         /* Pool for per-transaction stuff */
     apr_status_t rv;
     int is_idle = 0;

     free(ti);

     ap_scoreboard_image->servers[process_slot][thread_slot].pid = ap_my_pid;
     ap_scoreboard_image->servers[process_slot][thread_slot].generation = ap_my_generation;
     ap_update_child_status_from_indexes(process_slot, thread_slot,
                                         SERVER_STARTING, NULL);

     while (!workers_may_exit) {
         if (!is_idle) {
             rv = ap_queue_info_set_idle(worker_queue_info, NULL);
             if (rv != APR_SUCCESS) {
                 ap_log_error(APLOG_MARK, APLOG_EMERG, rv, ap_server_conf,
                              "ap_queue_info_set_idle failed. Attempting to "
                              "shutdown process gracefully.");
                 signal_threads(ST_GRACEFUL);
                 break;
             }
             is_idle = 1;
         }

         ap_update_child_status_from_indexes(process_slot, thread_slot,
                                             SERVER_READY, NULL);
       worker_pop:
         if (workers_may_exit) {
             break;
         }
         rv = ap_queue_pop(worker_queue, &csd, &cs, &ptrans);

         if (rv != APR_SUCCESS) {
             /* We get APR_EOF during a graceful shutdown once all the
              * connections accepted by this server process have been handled.
              */
             if (APR_STATUS_IS_EOF(rv)) {
                 break;
             }
             /* We get APR_EINTR whenever ap_queue_pop() has been interrupted
              * from an explicit call to ap_queue_interrupt_all(). This allows
              * us to unblock threads stuck in ap_queue_pop() when a shutdown
              * is pending.
              *
              * If workers_may_exit is set and this is ungraceful termination/
              * restart, we are bound to get an error on some systems (e.g.,
              * AIX, which sanity-checks mutex operations) since the queue
              * may have already been cleaned up.  Don't log the "error" if
              * workers_may_exit is set.
              */
             else if (APR_STATUS_IS_EINTR(rv)) {
                 goto worker_pop;
             }
             /* We got some other error. */
             else if (!workers_may_exit) {
                 ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ap_server_conf,
                              "ap_queue_pop failed");
             }
             continue;
         }
         is_idle = 0;
         worker_sockets[thread_slot] = csd;
         rv = process_socket(ptrans, csd, cs, process_slot, thread_slot);
         if (!rv) {
             requests_this_child--;
         }
         worker_sockets[thread_slot] = NULL;
     }

     ap_update_child_status_from_indexes(process_slot, thread_slot,
                                         (dying) ? SERVER_DEAD :
                                         SERVER_GRACEFUL,
                                         (request_rec *) NULL);

     apr_thread_exit(thd, APR_SUCCESS);
     return NULL;
 }

 static int check_signal(int signum)
 {
     switch (signum) {
     case SIGTERM:
     case SIGINT:
         return 1;
     }
     return 0;
 }


 static void create_listener_thread(thread_starter * ts)
 {
     int my_child_num = ts->child_num_arg;
     apr_threadattr_t *thread_attr = ts->threadattr;
     proc_info *my_info;
     apr_status_t rv;

     my_info = (proc_info *) malloc(sizeof(proc_info));
     my_info->pid = my_child_num;
     my_info->tid = -1;          /* listener thread doesn't have a thread slot */
     my_info->sd = 0;
     rv = apr_thread_create(&ts->listener, thread_attr, listener_thread,
                            my_info, pchild);
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ALERT, rv, ap_server_conf,
                      "apr_thread_create: unable to create listener thread");
         /* let the parent decide how bad this really is */
         clean_child_exit(APEXIT_CHILDSICK);
     }
     apr_os_thread_get(&listener_os_thread, ts->listener);
 }

 /* XXX under some circumstances not understood, children can get stuck
  *     in start_threads forever trying to take over slots which will
  *     never be cleaned up; for now there is an APLOG_DEBUG message issued
  *     every so often when this condition occurs
  */
 static void *APR_THREAD_FUNC start_threads(apr_thread_t * thd, void *dummy)
 {
     thread_starter *ts = dummy;
     apr_thread_t **threads = ts->threads;
     apr_threadattr_t *thread_attr = ts->threadattr;
     int child_num_arg = ts->child_num_arg;
     int my_child_num = child_num_arg;
     proc_info *my_info;
     apr_status_t rv;
     int i;
     int threads_created = 0;
     int listener_started = 0;
     int loops;
     int prev_threads_created;

     /* We must create the fd queues before we start up the listener
      * and worker threads. */
     worker_queue = apr_pcalloc(pchild, sizeof(*worker_queue));
     rv = ap_queue_init(worker_queue, ap_threads_per_child, pchild);
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ALERT, rv, ap_server_conf,
                      "ap_queue_init() failed");
         clean_child_exit(APEXIT_CHILDFATAL);
     }

     rv = ap_queue_info_create(&worker_queue_info, pchild,
                               ap_threads_per_child);
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ALERT, rv, ap_server_conf,
                      "ap_queue_info_create() failed");
         clean_child_exit(APEXIT_CHILDFATAL);
     }

     worker_sockets = apr_pcalloc(pchild, ap_threads_per_child
                                  * sizeof(apr_socket_t *));

     loops = prev_threads_created = 0;
     while (1) {
         /* ap_threads_per_child does not include the listener thread */
         for (i = 0; i < ap_threads_per_child; i++) {
             int status =
                 ap_scoreboard_image->servers[child_num_arg][i].status;

             if (status != SERVER_GRACEFUL && status != SERVER_DEAD) {
                 continue;
             }

             my_info = (proc_info *) malloc(sizeof(proc_info));
             if (my_info == NULL) {
                 ap_log_error(APLOG_MARK, APLOG_ALERT, errno, ap_server_conf,
                              "malloc: out of memory");
                 clean_child_exit(APEXIT_CHILDFATAL);
             }
             my_info->pid = my_child_num;
             my_info->tid = i;
             my_info->sd = 0;

             /* We are creating threads right now */
             ap_update_child_status_from_indexes(my_child_num, i,
                                                 SERVER_STARTING, NULL);
             /* We let each thread update its own scoreboard entry.  This is
              * done because it lets us deal with tid better.
              */
             rv = apr_thread_create(&threads[i], thread_attr,
                                    worker_thread, my_info, pchild);
             if (rv != APR_SUCCESS) {
                 ap_log_error(APLOG_MARK, APLOG_ALERT, rv, ap_server_conf,
                              "apr_thread_create: unable to create worker thread");
                 /* let the parent decide how bad this really is */
                 clean_child_exit(APEXIT_CHILDSICK);
             }
             threads_created++;
         }

         /* Start the listener only when there are workers available */
         if (!listener_started && threads_created) {
             create_listener_thread(ts);
             listener_started = 1;
         }


         if (start_thread_may_exit || threads_created == ap_threads_per_child) {
             break;
         }
         /* wait for previous generation to clean up an entry */
         apr_sleep(apr_time_from_sec(1));
         ++loops;
         if (loops % 120 == 0) { /* every couple of minutes */
             if (prev_threads_created == threads_created) {
                 ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ap_server_conf,
                              "child %" APR_PID_T_FMT " isn't taking over "
                              "slots very quickly (%d of %d)",
                              ap_my_pid, threads_created,
                              ap_threads_per_child);
             }
             prev_threads_created = threads_created;
         }
     }

     /* What state should this child_main process be listed as in the
      * scoreboard...?
      *  ap_update_child_status_from_indexes(my_child_num, i, SERVER_STARTING,
      *                                      (request_rec *) NULL);
      *
      *  This state should be listed separately in the scoreboard, in some kind
      *  of process_status, not mixed in with the worker threads' status.
      *  "life_status" is almost right, but it's in the worker's structure, and
      *  the name could be clearer.   gla
      */
     apr_thread_exit(thd, APR_SUCCESS);
     return NULL;
 }

 static void join_workers(apr_thread_t * listener, apr_thread_t ** threads)
 {
     int i;
     apr_status_t rv, thread_rv;

     if (listener) {
         int iter;

         /* deal with a rare timing window which affects waking up the
          * listener thread...  if the signal sent to the listener thread
          * is delivered between the time it verifies that the
          * listener_may_exit flag is clear and the time it enters a
          * blocking syscall, the signal didn't do any good...  work around
          * that by sleeping briefly and sending it again
          */

         iter = 0;
         while (iter < 10 &&
 #ifdef HAVE_PTHREAD_KILL
                pthread_kill(*listener_os_thread, 0)
 #else
                kill(ap_my_pid, 0)
 #endif
                == 0) {
             /* listener not dead yet */
             apr_sleep(apr_time_make(0, 500000));
             wakeup_listener();
             ++iter;
         }
         if (iter >= 10) {
             ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ap_server_conf,
                          "the listener thread didn't exit");
         }
         else {
             rv = apr_thread_join(&thread_rv, listener);
             if (rv != APR_SUCCESS) {
                 ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ap_server_conf,
                              "apr_thread_join: unable to join listener thread");
             }
         }
     }

     for (i = 0; i < ap_threads_per_child; i++) {
         if (threads[i]) {       /* if we ever created this thread */
             rv = apr_thread_join(&thread_rv, threads[i]);
             if (rv != APR_SUCCESS) {
                 ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ap_server_conf,
                              "apr_thread_join: unable to join worker "
                              "thread %d", i);
             }
         }
     }
 }

 static void join_start_thread(apr_thread_t * start_thread_id)
 {
     apr_status_t rv, thread_rv;

     start_thread_may_exit = 1;  /* tell it to give up in case it is still
                                  * trying to take over slots from a
                                  * previous generation
                                  */
     rv = apr_thread_join(&thread_rv, start_thread_id);
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ap_server_conf,
                      "apr_thread_join: unable to join the start " "thread");
     }
 }

 static void child_main(int child_num_arg)
 {
     apr_thread_t **threads;
     apr_status_t rv;
     thread_starter *ts;
     apr_threadattr_t *thread_attr;
     apr_thread_t *start_thread_id;

     mpm_state = AP_MPMQ_STARTING;       /* for benefit of any hooks that run as this
                                          * child initializes
                                          */
     ap_my_pid = getpid();
     ap_fatal_signal_child_setup(ap_server_conf);
     apr_pool_create(&pchild, pconf);

     /*stuff to do before we switch id's, so we have permissions. */
     ap_reopen_scoreboard(pchild, NULL, 0);

     if (unixd_setup_child()) {
         clean_child_exit(APEXIT_CHILDFATAL);
     }

     ap_run_child_init(pchild, ap_server_conf);

     /* done with init critical section */

     /* Just use the standard apr_setup_signal_thread to block all signals
      * from being received.  The child processes no longer use signals for
      * any communication with the parent process.
      */
     rv = apr_setup_signal_thread();
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_EMERG, rv, ap_server_conf,
                      "Couldn't initialize signal thread");
         clean_child_exit(APEXIT_CHILDFATAL);
     }

     if (ap_max_requests_per_child) {
         requests_this_child = ap_max_requests_per_child;
     }
     else {
         /* coding a value of zero means infinity */
         requests_this_child = INT_MAX;
     }

     /* Setup worker threads */

     /* clear the storage; we may not create all our threads immediately,
      * and we want a 0 entry to indicate a thread which was not created
      */
     threads = (apr_thread_t **) calloc(1,
                                        sizeof(apr_thread_t *) *
                                        ap_threads_per_child);
     if (threads == NULL) {
         ap_log_error(APLOG_MARK, APLOG_ALERT, errno, ap_server_conf,
                      "malloc: out of memory");
         clean_child_exit(APEXIT_CHILDFATAL);
     }

     ts = (thread_starter *) apr_palloc(pchild, sizeof(*ts));

     apr_threadattr_create(&thread_attr, pchild);
     /* 0 means PTHREAD_CREATE_JOINABLE */
     apr_threadattr_detach_set(thread_attr, 0);

     if (ap_thread_stacksize != 0) {
         apr_threadattr_stacksize_set(thread_attr, ap_thread_stacksize);
     }

     ts->threads = threads;
     ts->listener = NULL;
     ts->child_num_arg = child_num_arg;
     ts->threadattr = thread_attr;

     rv = apr_thread_create(&start_thread_id, thread_attr, start_threads,
                            ts, pchild);
     if (rv != APR_SUCCESS) {
         ap_log_error(APLOG_MARK, APLOG_ALERT, rv, ap_server_conf,
                      "apr_thread_create: unable to create worker thread");
         /* let the parent decide how bad this really is */
         clean_child_exit(APEXIT_CHILDSICK);
     }

     mpm_state = AP_MPMQ_RUNNING;

     /* If we are only running in one_process mode, we will want to
      * still handle signals. */
     if (one_process) {
         /* Block until we get a terminating signal. */
         apr_signal_thread(check_signal);
         /* make sure the start thread has finished; signal_threads()
          * and join_workers() depend on that
          */
         /* XXX join_start_thread() won't be awakened if one of our
          *     threads encounters a critical error and attempts to
          *     shutdown this child
          */
         join_start_thread(start_thread_id);

         /* helps us terminate a little more quickly than the dispatch of the
          * signal thread; beats the Pipe of Death and the browsers
          */
         signal_threads(ST_UNGRACEFUL);

         /* A terminating signal was received. Now join each of the
          * workers to clean them up.
          *   If the worker already exited, then the join frees
          *   their resources and returns.
          *   If the worker hasn't exited, then this blocks until
          *   they have (then cleans up).
          */
         join_workers(ts->listener, threads);
     }
     else {                      /* !one_process */
         /* remove SIGTERM from the set of blocked signals...  if one of
          * the other threads in the process needs to take us down
          * (e.g., for MaxRequestsPerChild) it will send us SIGTERM
          */
         unblock_signal(SIGTERM);
         apr_signal(SIGTERM, dummy_signal_handler);
         /* Watch for any messages from the parent over the POD */
         while (1) {
             rv = ap_mpm_pod_check(pod);
             if (rv == AP_NORESTART) {
                 /* see if termination was triggered while we slept */
                 switch (terminate_mode) {
                 case ST_GRACEFUL:
                     rv = AP_GRACEFUL;
                     break;
                 case ST_UNGRACEFUL:
                     rv = AP_RESTART;
                     break;
                 }
             }
             if (rv == AP_GRACEFUL || rv == AP_RESTART) {
                 /* make sure the start thread has finished;
                  * signal_threads() and join_workers depend on that
                  */
                 join_start_thread(start_thread_id);
                 signal_threads(rv ==
                                AP_GRACEFUL ? ST_GRACEFUL : ST_UNGRACEFUL);
                 break;
             }
         }

         /* A terminating signal was received. Now join each of the
          * workers to clean them up.
          *   If the worker already exited, then the join frees
          *   their resources and returns.
          *   If the worker hasn't exited, then this blocks until
          *   they have (then cleans up).
          */
         join_workers(ts->listener, threads);
     }

     free(threads);

     clean_child_exit(resource_shortage ? APEXIT_CHILDSICK : 0);
 }

 static int make_child(server_rec * s, int slot)
 {
     int pid;

     if (slot + 1 > ap_max_daemons_limit) {
         ap_max_daemons_limit = slot + 1;
     }

     if (one_process) {
         set_signals();
         ap_scoreboard_image->parent[slot].pid = getpid();
         child_main(slot);
     }

     if ((pid = fork()) == -1) {
         ap_log_error(APLOG_MARK, APLOG_ERR, errno, s,
                      "fork: Unable to fork new process");

         /* fork didn't succeed. Fix the scoreboard or else
          * it will say SERVER_STARTING forever and ever
          */
         ap_update_child_status_from_indexes(slot, 0, SERVER_DEAD, NULL);

         /* In case system resources are maxxed out, we don't want
            Apache running away with the CPU trying to fork over and
            over and over again. */
         apr_sleep(apr_time_from_sec(10));

         return -1;
     }

     if (!pid) {
 #ifdef HAVE_BINDPROCESSOR
         /* By default, AIX binds to a single processor.  This bit unbinds
          * children which will then bind to another CPU.
          */
         int status = bindprocessor(BINDPROCESS, (int) getpid(),
                                    PROCESSOR_CLASS_ANY);
         if (status != OK)
             ap_log_error(APLOG_MARK, APLOG_WARNING, errno,
                          ap_server_conf,
                          "processor unbind failed %d", status);
 #endif
         RAISE_SIGSTOP(MAKE_CHILD);

         apr_signal(SIGTERM, just_die);
         child_main(slot);

         clean_child_exit(0);
     }
     /* else */
     ap_scoreboard_image->parent[slot].quiescing = 0;
     ap_scoreboard_image->parent[slot].pid = pid;
     return 0;
 }

 /* start up a bunch of children */
 static void startup_children(int number_to_start)
 {
     int i;

     for (i = 0; number_to_start && i < ap_daemons_limit; ++i) {
         if (ap_scoreboard_image->parent[i].pid != 0) {
             continue;
         }
         if (make_child(ap_server_conf, i) < 0) {
             break;
         }
         --number_to_start;
     }
 }


 /*
  * idle_spawn_rate is the number of children that will be spawned on the
  * next maintenance cycle if there aren't enough idle servers.  It is
  * doubled up to MAX_SPAWN_RATE, and reset only when a cycle goes by
  * without the need to spawn.
  */
 static int idle_spawn_rate = 1;
 #ifndef MAX_SPAWN_RATE
 #define MAX_SPAWN_RATE        (32)
 #endif
 static int hold_off_on_exponential_spawning;

 static void perform_idle_server_maintenance(void)
 {
     int i, j;
     int idle_thread_count;
     worker_score *ws;
     process_score *ps;
     int free_length;
     int totally_free_length = 0;
     int free_slots[MAX_SPAWN_RATE];
     int last_non_dead;
     int total_non_dead;
     int active_thread_count = 0;

     /* initialize the free_list */
     free_length = 0;

     idle_thread_count = 0;
     last_non_dead = -1;
     total_non_dead = 0;

     for (i = 0; i < ap_daemons_limit; ++i) {
         /* Initialization to satisfy the compiler. It doesn't know
          * that ap_threads_per_child is always > 0 */
         int status = SERVER_DEAD;
         int any_dying_threads = 0;
         int any_dead_threads = 0;
         int all_dead_threads = 1;

         if (i >= ap_max_daemons_limit
             && totally_free_length == idle_spawn_rate)
             break;
         ps = &ap_scoreboard_image->parent[i];
         for (j = 0; j < ap_threads_per_child; j++) {
             ws = &ap_scoreboard_image->servers[i][j];
             status = ws->status;

             /* XXX any_dying_threads is probably no longer needed    GLA */
             any_dying_threads = any_dying_threads ||
                 (status == SERVER_GRACEFUL);
             any_dead_threads = any_dead_threads || (status == SERVER_DEAD);
             all_dead_threads = all_dead_threads &&
                 (status == SERVER_DEAD || status == SERVER_GRACEFUL);

             /* We consider a starting server as idle because we started it
              * at least a cycle ago, and if it still hasn't finished starting
              * then we're just going to swamp things worse by forking more.
              * So we hopefully won't need to fork more if we count it.
              * This depends on the ordering of SERVER_READY and SERVER_STARTING.
              */
             if (ps->pid != 0) { /* XXX just set all_dead_threads in outer
                                    for loop if no pid?  not much else matters */
                 if (status <= SERVER_READY && status != SERVER_DEAD &&
                         !ps->quiescing && ps->generation == ap_my_generation) {
                     ++idle_thread_count;
                 }
                 if (status >= SERVER_READY && status < SERVER_GRACEFUL) {
                     ++active_thread_count;
                 }
             }
         }
         if (any_dead_threads
             && totally_free_length < idle_spawn_rate
             && free_length < MAX_SPAWN_RATE
             && (!ps->pid      /* no process in the slot */
                   || ps->quiescing)) {  /* or at least one is going away */
             if (all_dead_threads) {
                 /* great! we prefer these, because the new process can
                  * start more threads sooner.  So prioritize this slot
                  * by putting it ahead of any slots with active threads.
                  *
                  * first, make room by moving a slot that's potentially still
                  * in use to the end of the array
                  */
                 free_slots[free_length] = free_slots[totally_free_length];
                 free_slots[totally_free_length++] = i;
             }
             else {
                 /* slot is still in use - back of the bus
                  */
                 free_slots[free_length] = i;
             }
             ++free_length;
         }
         /* XXX if (!ps->quiescing)     is probably more reliable  GLA */
         if (!any_dying_threads) {
             last_non_dead = i;
             ++total_non_dead;
         }
     }

     if (sick_child_detected) {
         if (active_thread_count > 0) {
             /* some child processes appear to be working.  don't kill the
              * whole server.
              */
             sick_child_detected = 0;
         }
         else {
             /* looks like a basket case.  give up.
              */
             shutdown_pending = 1;
             child_fatal = 1;
             ap_log_error(APLOG_MARK, APLOG_ALERT, 0,
                          ap_server_conf,
                          "No active workers found..."
                          " Apache is exiting!");
             /* the child already logged the failure details */
             return;
         }
     }

     ap_max_daemons_limit = last_non_dead + 1;

     if (idle_thread_count > max_spare_threads) {
         /* Kill off one child */
         ap_mpm_pod_signal(pod, TRUE);
         idle_spawn_rate = 1;
     }
     else if (idle_thread_count < min_spare_threads) {
         /* terminate the free list */
         if (free_length == 0) {
             /* only report this condition once */
             static int reported = 0;

             if (!reported) {
                 ap_log_error(APLOG_MARK, APLOG_ERR, 0,
                              ap_server_conf,
                              "server reached MaxClients setting, consider"
                              " raising the MaxClients setting");
                 reported = 1;
             }
             idle_spawn_rate = 1;
         }
         else {
             if (free_length > idle_spawn_rate) {
                 free_length = idle_spawn_rate;
             }
             if (idle_spawn_rate >= 8) {
                 ap_log_error(APLOG_MARK, APLOG_INFO, 0,
                              ap_server_conf,
                              "server seems busy, (you may need "
                              "to increase StartServers, ThreadsPerChild "
                              "or Min/MaxSpareThreads), "
                              "spawning %d children, there are around %d idle "
                              "threads, and %d total children", free_length,
                              idle_thread_count, total_non_dead);
             }
             for (i = 0; i < free_length; ++i) {
                 make_child(ap_server_conf, free_slots[i]);
             }
             /* the next time around we want to spawn twice as many if this
              * wasn't good enough, but not if we've just done a graceful
              */
             if (hold_off_on_exponential_spawning) {
                 --hold_off_on_exponential_spawning;
             }
             else if (idle_spawn_rate < MAX_SPAWN_RATE) {
                 idle_spawn_rate *= 2;
             }
         }
     }
     else {
         idle_spawn_rate = 1;
     }
 }

 static void server_main_loop(int remaining_children_to_start)
 {
     int child_slot;
     apr_exit_why_e exitwhy;
     int status, processed_status;
     apr_proc_t pid;
     int i;

     while (!restart_pending && !shutdown_pending) {
         ap_wait_or_timeout(&exitwhy, &status, &pid, pconf);

         if (pid.pid != -1) {
             processed_status = ap_process_child_status(&pid, exitwhy, status);
             if (processed_status == APEXIT_CHILDFATAL) {
                 shutdown_pending = 1;
                 child_fatal = 1;
                 return;
             }
             else if (processed_status == APEXIT_CHILDSICK) {
                 /* tell perform_idle_server_maintenance to check into this
                  * on the next timer pop
                  */
                 sick_child_detected = 1;
             }
             /* non-fatal death... note that it's gone in the scoreboard. */
             child_slot = find_child_by_pid(&pid);
             if (child_slot >= 0) {
                 for (i = 0; i < ap_threads_per_child; i++)
                     ap_update_child_status_from_indexes(child_slot, i,
                                                         SERVER_DEAD,
                                                         (request_rec *) NULL);

                 ap_scoreboard_image->parent[child_slot].pid = 0;
                 ap_scoreboard_image->parent[child_slot].quiescing = 0;
                 if (processed_status == APEXIT_CHILDSICK) {
                     /* resource shortage, minimize the fork rate */
                     idle_spawn_rate = 1;
                 }
                 else if (remaining_children_to_start
                          && child_slot < ap_daemons_limit) {
                     /* we're still doing a 1-for-1 replacement of dead
                      * children with new children
                      */
                     make_child(ap_server_conf, child_slot);
                     --remaining_children_to_start;
                 }
 #if APR_HAS_OTHER_CHILD
             }
             else if (apr_proc_other_child_alert(&pid, APR_OC_REASON_DEATH,
                                                 status) == 0) {
                 /* handled */
 #endif
             }
             else if (is_graceful) {
                 /* Great, we've probably just lost a slot in the
                  * scoreboard.  Somehow we don't know about this child.
                  */
                 ap_log_error(APLOG_MARK, APLOG_WARNING, 0,
                              ap_server_conf,
                              "long lost child came home! (pid %ld)",
                              (long) pid.pid);
             }
             /* Don't perform idle maintenance when a child dies,
              * only do it when there's a timeout.  Remember only a
              * finite number of children can die, and it's pretty
              * pathological for a lot to die suddenly.
              */
             continue;
         }
         else if (remaining_children_to_start) {
             /* we hit a 1 second timeout in which none of the previous
              * generation of children needed to be reaped... so assume
              * they're all done, and pick up the slack if any is left.
              */
             startup_children(remaining_children_to_start);
             remaining_children_to_start = 0;
             /* In any event we really shouldn't do the code below because
              * few of the servers we just started are in the IDLE state
              * yet, so we'd mistakenly create an extra server.
              */
             continue;
         }

         perform_idle_server_maintenance();
     }
 }

 int ap_mpm_run(apr_pool_t * _pconf, apr_pool_t * plog, server_rec * s)
 {
     int remaining_children_to_start;

     ap_log_pid(pconf, ap_pid_fname);

     first_server_limit = server_limit;
     first_thread_limit = thread_limit;

     if (changed_limit_at_restart) {
         ap_log_error(APLOG_MARK, APLOG_WARNING, 0, s,
                      "WARNING: Attempt to change ServerLimit or ThreadLimit "
                      "ignored during restart");
         changed_limit_at_restart = 0;
     }

     if (!is_graceful) {
         if (ap_run_pre_mpm(s->process->pool, SB_SHARED) != OK) {
             mpm_state = AP_MPMQ_STOPPING;
             return 1;
         }
         /* fix the generation number in the global score; we just got a new,
          * cleared scoreboard
          */
         ap_scoreboard_image->global->running_generation = ap_my_generation;
     }

     set_signals();
     /* Don't thrash... */
     if (max_spare_threads < min_spare_threads + ap_threads_per_child)
         max_spare_threads = min_spare_threads + ap_threads_per_child;

     /* If we're doing a graceful_restart then we're going to see a lot
      * of children exiting immediately when we get into the main loop
      * below (because we just sent them AP_SIG_GRACEFUL).  This happens pretty
      * rapidly... and for each one that exits we'll start a new one until
      * we reach at least daemons_min_free.  But we may be permitted to
      * start more than that, so we'll just keep track of how many we're
      * supposed to start up without the 1 second penalty between each fork.
      */
     remaining_children_to_start = ap_daemons_to_start;
     if (remaining_children_to_start > ap_daemons_limit) {
         remaining_children_to_start = ap_daemons_limit;
     }
     if (!is_graceful) {
         startup_children(remaining_children_to_start);
         remaining_children_to_start = 0;
     }
     else {
         /* give the system some time to recover before kicking into
          * exponential mode */
         hold_off_on_exponential_spawning = 10;
     }

     ap_log_error(APLOG_MARK, APLOG_NOTICE, 0, ap_server_conf,
                  "%s configured -- resuming normal operations",
                  ap_get_server_version());
     ap_log_error(APLOG_MARK, APLOG_INFO, 0, ap_server_conf,
                  "Server built: %s", ap_get_server_built());

     restart_pending = shutdown_pending = 0;
     mpm_state = AP_MPMQ_RUNNING;

     server_main_loop(remaining_children_to_start);
     mpm_state = AP_MPMQ_STOPPING;

     if (shutdown_pending && !is_graceful) {
         /* Time to shut down:
          * Kill child processes, tell them to call child_exit, etc...
          */
         ap_mpm_pod_killpg(pod, ap_daemons_limit, FALSE);
         ap_reclaim_child_processes(1);  /* Start with SIGTERM */

         if (!child_fatal) {
             /* cleanup pid file on normal shutdown */
             const char *pidfile = NULL;
             pidfile = ap_server_root_relative(pconf, ap_pid_fname);
             if (pidfile != NULL && unlink(pidfile) == 0)
                 ap_log_error(APLOG_MARK, APLOG_INFO, 0,
                              ap_server_conf,
                              "removed PID file %s (pid=%ld)",
                              pidfile, (long) getpid());

             ap_log_error(APLOG_MARK, APLOG_NOTICE, 0,
                          ap_server_conf, "caught SIGTERM, shutting down");
         }
         return 1;
     } else if (shutdown_pending) {
         /* Time to gracefully shut down:
          * Kill child processes, tell them to call child_exit, etc...
          */
         int active_children;
         int index;
         apr_time_t cutoff = 0;

         /* Close our listeners, and then ask our children to do same */
         ap_close_listeners();
         ap_mpm_pod_killpg(pod, ap_daemons_limit, TRUE);
         ap_relieve_child_processes();

         if (!child_fatal) {
             /* cleanup pid file on normal shutdown */
             const char *pidfile = NULL;
             pidfile = ap_server_root_relative (pconf, ap_pid_fname);
             if ( pidfile != NULL && unlink(pidfile) == 0)
                 ap_log_error(APLOG_MARK, APLOG_INFO, 0,
                              ap_server_conf,
                              "removed PID file %s (pid=%ld)",
                              pidfile, (long)getpid());

             ap_log_error(APLOG_MARK, APLOG_NOTICE, 0,
                          ap_server_conf, "caught SIGTERM, shutting down");
         }

         /* Don't really exit until each child has finished */
         shutdown_pending = 0;
         do {
             /* Pause for a second */
             apr_sleep(apr_time_from_sec(1));

             /* Relieve any children which have now exited */
             ap_relieve_child_processes();

             active_children = 0;
             for (index = 0; index < ap_daemons_limit; ++index) {
                 if (MPM_CHILD_PID(index) != 0) {
                     if (kill(MPM_CHILD_PID(index), 0) == 0) {
                             active_children = 1;
                             /* Having just one child is enough to stay around */
                             break;
                     }
                 }
             }
         } while (!shutdown_pending && active_children &&
                  (!ap_graceful_shutdown_timeout || apr_time_now() < cutoff));

         /* We might be here because we received SIGTERM, either
          * way, try and make sure that all of our processes are
          * really dead.
          */
         ap_mpm_pod_killpg(pod, ap_daemons_limit, FALSE);
         ap_reclaim_child_processes(1);

         return 1;
     }

     /* we've been told to restart */
     apr_signal(SIGHUP, SIG_IGN);

     if (one_process) {
         /* not worth thinking about */
         return 1;
     }

     /* advance to the next generation */
     /* XXX: we really need to make sure this new generation number isn't in
      * use by any of the children.
      */
     ++ap_my_generation;
     ap_scoreboard_image->global->running_generation = ap_my_generation;

     if (is_graceful) {
         ap_log_error(APLOG_MARK, APLOG_NOTICE, 0, ap_server_conf,
                      AP_SIG_GRACEFUL_STRING
                      " received.  Doing graceful restart");
         /* wake up the children...time to die.  But we'll have more soon */
         ap_mpm_pod_killpg(pod, ap_daemons_limit, TRUE);


         /* This is mostly for debugging... so that we know what is still
          * gracefully dealing with existing request.
          */

     }
     else {
         /* Kill 'em all.  Since the child acts the same on the parents SIGTERM
          * and a SIGHUP, we may as well use the same signal, because some user
          * pthreads are stealing signals from us left and right.
          */
         ap_mpm_pod_killpg(pod, ap_daemons_limit, FALSE);

         ap_reclaim_child_processes(1);  /* Start with SIGTERM */
         ap_log_error(APLOG_MARK, APLOG_NOTICE, 0, ap_server_conf,
                      "SIGHUP received.  Attempting to restart");
     }

     return 0;
 }

 /* This really should be a post_config hook, but the error log is already
  * redirected by that point, so we need to do this in the open_logs phase.
  */
 static int worker_open_logs(apr_pool_t * p, apr_pool_t * plog,
                             apr_pool_t * ptemp, server_rec * s)
 {
     apr_status_t rv;

     pconf = p;
     ap_server_conf = s;

     if ((num_listensocks = ap_setup_listeners(ap_server_conf)) < 1) {
         ap_log_error(APLOG_MARK, APLOG_ALERT | APLOG_STARTUP, 0,
                      NULL, "no listening sockets available, shutting down");
         return DONE;
     }

     if (!one_process) {
         if ((rv = ap_mpm_pod_open(pconf, &pod))) {
             ap_log_error(APLOG_MARK, APLOG_CRIT | APLOG_STARTUP, rv, NULL,
                          "Could not open pipe-of-death.");
             return DONE;
         }
     }
     return OK;
 }

 static int worker_pre_config(apr_pool_t * pconf, apr_pool_t * plog,
                              apr_pool_t * ptemp)
 {
     static int restart_num = 0;
     int no_detach, debug, foreground;
     ap_directive_t *pdir;
     ap_directive_t *max_clients = NULL;
     apr_status_t rv;

     mpm_state = AP_MPMQ_STARTING;

     /* make sure that "ThreadsPerChild" gets set before "MaxClients" */
     for (pdir = ap_conftree; pdir != NULL; pdir = pdir->next) {
         if (strncasecmp(pdir->directive, "ThreadsPerChild", 15) == 0) {
             if (!max_clients) {
                 /* we're in the clear, got ThreadsPerChild first */
                 break;
             }
             else {
                 /* now to swap the data */
                 ap_directive_t temp;

                 temp.directive = pdir->directive;
                 temp.args = pdir->args;
                 /* Make sure you don't change 'next', or you may get loops! */
                 /* XXX: first_child, parent, and data can never be set
                  * for these directives, right? -aaron */
                 temp.filename = pdir->filename;
                 temp.line_num = pdir->line_num;

                 pdir->directive = max_clients->directive;
                 pdir->args = max_clients->args;
                 pdir->filename = max_clients->filename;
                 pdir->line_num = max_clients->line_num;

                 max_clients->directive = temp.directive;
                 max_clients->args = temp.args;
                 max_clients->filename = temp.filename;
                 max_clients->line_num = temp.line_num;
                 break;
             }
         }
         else if (!max_clients
                  && strncasecmp(pdir->directive, "MaxClients", 10) == 0) {
             max_clients = pdir;
         }
     }

     debug = ap_exists_config_define("DEBUG");

     if (debug) {
         foreground = one_process = 1;
         no_detach = 0;
     }
     else {
         one_process = ap_exists_config_define("ONE_PROCESS");
         no_detach = ap_exists_config_define("NO_DETACH");
         foreground = ap_exists_config_define("FOREGROUND");
     }

     /* sigh, want this only the second time around */
     if (restart_num++ == 1) {
         is_graceful = 0;
         rv = apr_pollset_create(&event_pollset, 1, plog,
                                 APR_POLLSET_THREADSAFE | APR_POLLSET_NOCOPY);
         if (rv != APR_SUCCESS) {
             ap_log_error(APLOG_MARK, APLOG_CRIT, rv, NULL,
                          "Couldn't create a Thread Safe Pollset. "
                          "Is it supported on your platform?");
             return HTTP_INTERNAL_SERVER_ERROR;
         }
         apr_pollset_destroy(event_pollset);

         if (!one_process && !foreground) {
             rv = apr_proc_detach(no_detach ? APR_PROC_DETACH_FOREGROUND
                                  : APR_PROC_DETACH_DAEMONIZE);
             if (rv != APR_SUCCESS) {
                 ap_log_error(APLOG_MARK, APLOG_CRIT, rv, NULL,
                              "apr_proc_detach failed");
                 return HTTP_INTERNAL_SERVER_ERROR;
             }
         }
         parent_pid = ap_my_pid = getpid();
     }

     unixd_pre_config(ptemp);
     ap_listen_pre_config();
     ap_daemons_to_start = DEFAULT_START_DAEMON;
     min_spare_threads = DEFAULT_MIN_FREE_DAEMON * DEFAULT_THREADS_PER_CHILD;
     max_spare_threads = DEFAULT_MAX_FREE_DAEMON * DEFAULT_THREADS_PER_CHILD;
     ap_daemons_limit = server_limit;
     ap_threads_per_child = DEFAULT_THREADS_PER_CHILD;
     ap_pid_fname = DEFAULT_PIDLOG;
     ap_lock_fname = DEFAULT_LOCKFILE;
     ap_max_requests_per_child = DEFAULT_MAX_REQUESTS_PER_CHILD;
     ap_extended_status = 0;
 #ifdef AP_MPM_WANT_SET_MAX_MEM_FREE
     ap_max_mem_free = APR_ALLOCATOR_MAX_FREE_UNLIMITED;
 #endif

     apr_cpystrn(ap_coredump_dir, ap_server_root, sizeof(ap_coredump_dir));

     return OK;
 }

 static void event_hooks(apr_pool_t * p)
 {
     /* The worker open_logs phase must run before the core's, or stderr
      * will be redirected to a file, and the messages won't print to the
      * console.
      */
     static const char *const aszSucc[] = { "core.c", NULL };
     one_process = 0;

     ap_hook_open_logs(worker_open_logs, NULL, aszSucc, APR_HOOK_MIDDLE);
     /* we need to set the MPM state before other pre-config hooks use MPM query
      * to retrieve it, so register as REALLY_FIRST
      */
     ap_hook_pre_config(worker_pre_config, NULL, NULL, APR_HOOK_REALLY_FIRST);
 }

 static const char *set_daemons_to_start(cmd_parms *cmd, void *dummy,
                                         const char *arg)
 {
     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     ap_daemons_to_start = atoi(arg);
     return NULL;
 }

 static const char *set_min_spare_threads(cmd_parms * cmd, void *dummy,
                                          const char *arg)
 {
     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     min_spare_threads = atoi(arg);
     if (min_spare_threads <= 0) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: detected MinSpareThreads set to non-positive.");
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "Resetting to 1 to avoid almost certain Apache failure.");
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "Please read the documentation.");
         min_spare_threads = 1;
     }

     return NULL;
 }

 static const char *set_max_spare_threads(cmd_parms * cmd, void *dummy,
                                          const char *arg)
 {
     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     max_spare_threads = atoi(arg);
     return NULL;
 }

 static const char *set_max_clients(cmd_parms * cmd, void *dummy,
                                    const char *arg)
 {
     int max_clients;
     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     /* It is ok to use ap_threads_per_child here because we are
      * sure that it gets set before MaxClients in the pre_config stage. */
     max_clients = atoi(arg);
     if (max_clients < ap_threads_per_child) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: MaxClients (%d) must be at least as large",
                      max_clients);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " as ThreadsPerChild (%d). Automatically",
                      ap_threads_per_child);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " increasing MaxClients to %d.", ap_threads_per_child);
         max_clients = ap_threads_per_child;
     }
     ap_daemons_limit = max_clients / ap_threads_per_child;
     if ((max_clients > 0) && (max_clients % ap_threads_per_child)) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: MaxClients (%d) is not an integer multiple",
                      max_clients);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " of ThreadsPerChild (%d), lowering MaxClients to %d",
                      ap_threads_per_child,
                      ap_daemons_limit * ap_threads_per_child);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " for a maximum of %d child processes,",
                      ap_daemons_limit);
         max_clients = ap_daemons_limit * ap_threads_per_child;
     }
     if (ap_daemons_limit > server_limit) {
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     "WARNING: MaxClients of %d would require %d servers,",
                     max_clients, ap_daemons_limit);
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     " and would exceed the ServerLimit value of %d.",
                     server_limit);
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     " Automatically lowering MaxClients to %d.  To increase,",
                     server_limit * ap_threads_per_child);
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     " please see the ServerLimit directive.");
        ap_daemons_limit = server_limit;
     }
     else if (ap_daemons_limit < 1) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: Require MaxClients > 0, setting to 1");
         ap_daemons_limit = 1;
     }
     return NULL;
 }

 static const char *set_threads_per_child(cmd_parms * cmd, void *dummy,
                                          const char *arg)
 {
     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     ap_threads_per_child = atoi(arg);
     if (ap_threads_per_child > thread_limit) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: ThreadsPerChild of %d exceeds ThreadLimit "
                      "value of %d", ap_threads_per_child, thread_limit);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "threads, lowering ThreadsPerChild to %d. To increase, "
                      "please see the", thread_limit);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " ThreadLimit directive.");
         ap_threads_per_child = thread_limit;
     }
     else if (ap_threads_per_child < 1) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: Require ThreadsPerChild > 0, setting to 1");
         ap_threads_per_child = 1;
     }
     return NULL;
 }
 static const char *set_server_limit (cmd_parms *cmd, void *dummy, const char *arg)
 {
     int tmp_server_limit;

     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     tmp_server_limit = atoi(arg);
     /* you cannot change ServerLimit across a restart; ignore
      * any such attempts
      */
     if (first_server_limit &&
         tmp_server_limit != server_limit) {
         /* how do we log a message?  the error log is a bit bucket at this
          * point; we'll just have to set a flag so that ap_mpm_run()
          * logs a warning later
          */
         changed_limit_at_restart = 1;
         return NULL;
     }
     server_limit = tmp_server_limit;

     if (server_limit > MAX_SERVER_LIMIT) {
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     "WARNING: ServerLimit of %d exceeds compile time limit "
                     "of %d servers,", server_limit, MAX_SERVER_LIMIT);
        ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                     " lowering ServerLimit to %d.", MAX_SERVER_LIMIT);
        server_limit = MAX_SERVER_LIMIT;
     }
     else if (server_limit < 1) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: Require ServerLimit > 0, setting to 1");
         server_limit = 1;
     }
     return NULL;
 }

 static const char *set_thread_limit(cmd_parms * cmd, void *dummy,
                                     const char *arg)
 {
     int tmp_thread_limit;

     const char *err = ap_check_cmd_context(cmd, GLOBAL_ONLY);
     if (err != NULL) {
         return err;
     }

     tmp_thread_limit = atoi(arg);
     /* you cannot change ThreadLimit across a restart; ignore
      * any such attempts
      */
     if (first_thread_limit && tmp_thread_limit != thread_limit) {
         /* how do we log a message?  the error log is a bit bucket at this
          * point; we'll just have to set a flag so that ap_mpm_run()
          * logs a warning later
          */
         changed_limit_at_restart = 1;
         return NULL;
     }
     thread_limit = tmp_thread_limit;

     if (thread_limit > MAX_THREAD_LIMIT) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: ThreadLimit of %d exceeds compile time limit "
                      "of %d servers,", thread_limit, MAX_THREAD_LIMIT);
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      " lowering ThreadLimit to %d.", MAX_THREAD_LIMIT);
         thread_limit = MAX_THREAD_LIMIT;
     }
     else if (thread_limit < 1) {
         ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL,
                      "WARNING: Require ThreadLimit > 0, setting to 1");
         thread_limit = 1;
     }
     return NULL;
 }

 static const command_rec event_cmds[] = {
     UNIX_DAEMON_COMMANDS,
     LISTEN_COMMANDS,
     AP_INIT_TAKE1("StartServers", set_daemons_to_start, NULL, RSRC_CONF,
                   "Number of child processes launched at server startup"),
     AP_INIT_TAKE1("ServerLimit", set_server_limit, NULL, RSRC_CONF,
                   "Maximum number of child processes for this run of Apache"),
     AP_INIT_TAKE1("MinSpareThreads", set_min_spare_threads, NULL, RSRC_CONF,
                   "Minimum number of idle threads, to handle request spikes"),
     AP_INIT_TAKE1("MaxSpareThreads", set_max_spare_threads, NULL, RSRC_CONF,
                   "Maximum number of idle threads"),
     AP_INIT_TAKE1("MaxClients", set_max_clients, NULL, RSRC_CONF,
                   "Maximum number of threads alive at the same time"),
     AP_INIT_TAKE1("ThreadsPerChild", set_threads_per_child, NULL, RSRC_CONF,
                   "Number of threads each child creates"),
     AP_INIT_TAKE1("ThreadLimit", set_thread_limit, NULL, RSRC_CONF,
                   "Maximum number of worker threads per child process for this "
                   "run of Apache - Upper limit for ThreadsPerChild"),
     AP_GRACEFUL_SHUTDOWN_TIMEOUT_COMMAND,
     {NULL}
 };

 module AP_MODULE_DECLARE_DATA mpm_event_module = {
     MPM20_MODULE_STUFF,
     ap_mpm_rewrite_args,        /* hook to run before apache parses args */
     NULL,                       /* create per-directory config structure */
     NULL,                       /* merge per-directory config structures */
     NULL,                       /* create per-server config structure */
     NULL,                       /* merge per-server config structures */
     event_cmds,                 /* command apr_table_t */
     event_hooks                 /* register_hooks */
 };