]> git.sur5r.net Git - openldap/blobdiff - servers/slapd/daemon.c
ITS#6870 fix winsock wake_sds init
[openldap] / servers / slapd / daemon.c
index 31596c4846bdc572bed4d7016f02fc0198375154..21821aafdd6123be1e524672893c90501d247f21 100644 (file)
@@ -1,7 +1,8 @@
 /* $OpenLDAP$ */
 /* This work is part of OpenLDAP Software <http://www.openldap.org/>.
  *
- * Copyright 1998-2006 The OpenLDAP Foundation.
+ * Copyright 1998-2011 The OpenLDAP Foundation.
+ * Portions Copyright 2007 by Howard Chu, Symas Corporation.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
 
 #if defined(HAVE_SYS_EPOLL_H) && defined(HAVE_EPOLL)
 # include <sys/epoll.h>
-#endif
+#elif defined(SLAP_X_DEVPOLL) && defined(HAVE_SYS_DEVPOLL_H) && defined(HAVE_DEVPOLL)
+# include <sys/types.h>
+# include <sys/stat.h>
+# include <fcntl.h>
+# include <sys/devpoll.h>
+#endif /* ! epoll && ! /dev/poll */
 
 #ifdef HAVE_TCPD
-# include <tcpd.h>
 int allow_severity = LOG_INFO;
 int deny_severity = LOG_NOTICE;
-
-# define SLAP_STRING_UNKNOWN   STRING_UNKNOWN
-#else /* ! TCP Wrappers */
-# define SLAP_STRING_UNKNOWN   "unknown"
-#endif /* ! TCP Wrappers */
+#endif /* TCP Wrappers */
 
 #ifdef LDAP_PF_LOCAL
 # include <sys/stat.h>
@@ -62,9 +63,9 @@ int deny_severity = LOG_NOTICE;
 
 #ifdef LDAP_PF_INET6
 int slap_inet4or6 = AF_UNSPEC;
-#else
+#else /* ! INETv6 */
 int slap_inet4or6 = AF_INET;
-#endif
+#endif /* ! INETv6 */
 
 /* globals */
 time_t starttime;
@@ -72,122 +73,166 @@ ber_socket_t dtblsize;
 slap_ssf_t local_ssf = LDAP_PVT_SASL_LOCAL_SSF;
 struct runqueue_s slapd_rq;
 
+#define MAX_DAEMON_THREADS     16
+int slapd_daemon_threads = 1;
+int slapd_daemon_mask;
+
+#ifdef LDAP_TCP_BUFFER
+int slapd_tcp_rmem;
+int slapd_tcp_wmem;
+#endif /* LDAP_TCP_BUFFER */
+
 Listener **slap_listeners = NULL;
+static volatile sig_atomic_t listening = 1; /* 0 when slap_listeners closed */
 
 #ifndef SLAPD_LISTEN_BACKLOG
 #define SLAPD_LISTEN_BACKLOG 1024
-#endif
+#endif /* ! SLAPD_LISTEN_BACKLOG */
 
-static ber_socket_t wake_sds[2];
+#define        DAEMON_ID(fd)   (fd & slapd_daemon_mask)
+
+static ber_socket_t wake_sds[MAX_DAEMON_THREADS][2];
 static int emfile;
 
+static time_t chk_writetime;
+
 static volatile int waking;
 #ifdef NO_THREADS
-#define WAKE_LISTENER(w)       do { \
+#define WAKE_LISTENER(l,w)     do { \
        if ((w) && ++waking < 5) { \
-               tcp_write( wake_sds[1], "0", 1 ); \
+               tcp_write( SLAP_FD2SOCK(wake_sds[l][1]), "0", 1 ); \
        } \
-} while(0)
-#else
-#define WAKE_LISTENER(w)       do { \
+} while (0)
+#else /* ! NO_THREADS */
+#define WAKE_LISTENER(l,w)     do { \
        if (w) { \
-               tcp_write( wake_sds[1], "0", 1 ); \
+               tcp_write( SLAP_FD2SOCK(wake_sds[l][1]), "0", 1 ); \
        } \
-} while(0)
-#endif
+} while (0)
+#endif /* ! NO_THREADS */
 
 volatile sig_atomic_t slapd_shutdown = 0;
 volatile sig_atomic_t slapd_gentle_shutdown = 0;
 volatile sig_atomic_t slapd_abrupt_shutdown = 0;
 
-static struct slap_daemon {
-       ldap_pvt_thread_mutex_t sd_mutex;
-#ifdef HAVE_TCPD
-       ldap_pvt_thread_mutex_t tcpd_mutex;
+#ifdef HAVE_WINSOCK
+ldap_pvt_thread_mutex_t slapd_ws_mutex;
+SOCKET *slapd_ws_sockets;
+#define        SD_READ 1
+#define        SD_WRITE        2
+#define        SD_ACTIVE       4
+#define        SD_LISTENER     8
 #endif
 
-       ber_socket_t sd_nactives;
-       int sd_nwriters;
+#ifdef HAVE_TCPD
+static ldap_pvt_thread_mutex_t sd_tcpd_mutex;
+#endif /* TCP Wrappers */
 
-#ifdef HAVE_EPOLL
-       struct epoll_event *sd_epolls;
-       int     sd_nepolls;
-       int     *sd_index;
-       int     sd_epfd;
-       int     sd_nfds;
-#else
-#ifndef HAVE_WINSOCK
-       /* In winsock, accept() returns values higher than dtblsize
-               so don't bother with this optimization */
-       int sd_nfds;
-#endif
-       fd_set sd_actives;
-       fd_set sd_readers;
-       fd_set sd_writers;
-#endif
-} slap_daemon;
+typedef struct slap_daemon_st {
+       ldap_pvt_thread_mutex_t sd_mutex;
 
-#ifdef HAVE_EPOLL
+       ber_socket_t            sd_nactives;
+       int                     sd_nwriters;
+       int                     sd_nfds;
+
+#if defined(HAVE_EPOLL)
+       struct epoll_event      *sd_epolls;
+       int                     *sd_index;
+       int                     sd_epfd;
+#elif defined(SLAP_X_DEVPOLL) && defined(HAVE_DEVPOLL)
+       /* eXperimental */
+       struct pollfd           *sd_pollfd;
+       int                     *sd_index;
+       Listener                **sd_l;
+       int                     sd_dpfd;
+#else /* ! epoll && ! /dev/poll */
+#ifdef HAVE_WINSOCK
+       char    *sd_flags;
+       char    *sd_rflags;
+#else /* ! HAVE_WINSOCK */
+       fd_set                  sd_actives;
+       fd_set                  sd_readers;
+       fd_set                  sd_writers;
+#endif /* ! HAVE_WINSOCK */
+#endif /* ! epoll && ! /dev/poll */
+} slap_daemon_st;
+
+static slap_daemon_st slap_daemon[MAX_DAEMON_THREADS];
+
+/*
+ * NOTE: naming convention for macros:
+ *
+ * - SLAP_SOCK_* and SLAP_EVENT_* for public interface that deals
+ *   with file descriptors and events respectively
+ *
+ * - SLAP_<type>_* for private interface; type by now is one of
+ *   EPOLL, DEVPOLL, SELECT
+ *
+ * private interface should not be used in the code.
+ */
+#if defined(HAVE_EPOLL)
+/***************************************
+ * Use epoll infrastructure - epoll(4) *
+ ***************************************/
+# define SLAP_EVENT_FNAME              "epoll"
 # define SLAP_EVENTS_ARE_INDEXED       0
-# define SLAP_SOCK_IX(s)       (slap_daemon.sd_index[(s)])
-# define SLAP_SOCK_EP(s)       (slap_daemon.sd_epolls[SLAP_SOCK_IX(s)])
-# define SLAP_SOCK_EV(s)       (SLAP_SOCK_EP(s).events)
-# define SLAP_SOCK_IS_ACTIVE(s)        (SLAP_SOCK_IX(s) != -1)
-# define SLAP_SOCK_NOT_ACTIVE(s)       (SLAP_SOCK_IX(s) == -1)
-# define SLAP_SOCK_IS_SET(s, mode)     (SLAP_SOCK_EV(s) & (mode))
-
-# define SLAP_SOCK_IS_READ(s)  SLAP_SOCK_IS_SET((s), EPOLLIN)
-# define SLAP_SOCK_IS_WRITE(s) SLAP_SOCK_IS_SET((s), EPOLLOUT)
-
-# define SLAP_SET_SOCK(s, mode) do { \
-       if ((SLAP_SOCK_EV(s) & (mode)) != (mode)) {     \
-               SLAP_SOCK_EV(s) |= (mode); \
-               epoll_ctl(slap_daemon.sd_epfd, EPOLL_CTL_MOD, (s), \
-                       &SLAP_SOCK_EP(s)); \
+# define SLAP_EPOLL_SOCK_IX(t,s)               (slap_daemon[t].sd_index[(s)])
+# define SLAP_EPOLL_SOCK_EP(t,s)               (slap_daemon[t].sd_epolls[SLAP_EPOLL_SOCK_IX(t,s)])
+# define SLAP_EPOLL_SOCK_EV(t,s)               (SLAP_EPOLL_SOCK_EP(t,s).events)
+# define SLAP_SOCK_IS_ACTIVE(t,s)              (SLAP_EPOLL_SOCK_IX(t,s) != -1)
+# define SLAP_SOCK_NOT_ACTIVE(t,s)     (SLAP_EPOLL_SOCK_IX(t,s) == -1)
+# define SLAP_EPOLL_SOCK_IS_SET(t,s, mode)     (SLAP_EPOLL_SOCK_EV(t,s) & (mode))
+
+# define SLAP_SOCK_IS_READ(t,s)                SLAP_EPOLL_SOCK_IS_SET(t,(s), EPOLLIN)
+# define SLAP_SOCK_IS_WRITE(t,s)               SLAP_EPOLL_SOCK_IS_SET(t,(s), EPOLLOUT)
+
+# define SLAP_EPOLL_SOCK_SET(t,s, mode)        do { \
+       if ( (SLAP_EPOLL_SOCK_EV(t,s) & (mode)) != (mode) ) {   \
+               SLAP_EPOLL_SOCK_EV(t,s) |= (mode); \
+               epoll_ctl( slap_daemon[t].sd_epfd, EPOLL_CTL_MOD, (s), \
+                       &SLAP_EPOLL_SOCK_EP(t,s) ); \
        } \
-} while(0)
+} while (0)
 
-# define SLAP_CLR_SOCK(s, mode) do { \
-       if ((SLAP_SOCK_EV(s) & (mode))) { \
-               SLAP_SOCK_EV(s) &= ~(mode);     \
-               epoll_ctl(slap_daemon.sd_epfd, EPOLL_CTL_MOD, s, \
-                       &SLAP_SOCK_EP(s)); \
+# define SLAP_EPOLL_SOCK_CLR(t,s, mode)        do { \
+       if ( (SLAP_EPOLL_SOCK_EV(t,s) & (mode)) ) { \
+               SLAP_EPOLL_SOCK_EV(t,s) &= ~(mode);     \
+               epoll_ctl( slap_daemon[t].sd_epfd, EPOLL_CTL_MOD, s, \
+                       &SLAP_EPOLL_SOCK_EP(t,s) ); \
        } \
-} while(0)
+} while (0)
 
-# define SLAP_SOCK_SET_READ(s) SLAP_SET_SOCK(s, EPOLLIN)
-# define SLAP_SOCK_SET_WRITE(s)        SLAP_SET_SOCK(s, EPOLLOUT)
+# define SLAP_SOCK_SET_READ(t,s)               SLAP_EPOLL_SOCK_SET(t,s, EPOLLIN)
+# define SLAP_SOCK_SET_WRITE(t,s)              SLAP_EPOLL_SOCK_SET(t,s, EPOLLOUT)
 
-# ifdef SLAP_LIGHTWEIGHT_DISPATCHER
-#  define SLAP_SOCK_SET_SUSPEND(s) \
-       ( slap_daemon.sd_suspend[SLAP_SOCK_IX(s)] = 1 )
-#  define SLAP_SOCK_CLR_SUSPEND(s) \
-       ( slap_daemon.sd_suspend[SLAP_SOCK_IX(s)] = 0 )
-#  define SLAP_SOCK_IS_SUSPEND(s) \
-       ( slap_daemon.sd_suspend[SLAP_SOCK_IX(s)] == 1 )
-# endif
+# define SLAP_SOCK_CLR_READ(t,s)               SLAP_EPOLL_SOCK_CLR(t,(s), EPOLLIN)
+# define SLAP_SOCK_CLR_WRITE(t,s)              SLAP_EPOLL_SOCK_CLR(t,(s), EPOLLOUT)
 
-# define SLAP_SOCK_CLR_READ(s) SLAP_CLR_SOCK((s), EPOLLIN)
-# define SLAP_SOCK_CLR_WRITE(s)        SLAP_CLR_SOCK((s), EPOLLOUT)
+#  define SLAP_SOCK_SET_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_EPOLL_SOCK_IX(t,s)] = 1 )
+#  define SLAP_SOCK_CLR_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_EPOLL_SOCK_IX(t,s)] = 0 )
+#  define SLAP_SOCK_IS_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_EPOLL_SOCK_IX(t,s)] == 1 )
 
-# define SLAP_CLR_EVENT(i, mode)       (revents[(i)].events &= ~(mode))
+# define SLAP_EPOLL_EVENT_CLR(i, mode) (revents[(i)].events &= ~(mode))
 
-# define SLAP_EVENT_MAX        slap_daemon.sd_nfds
+# define SLAP_EVENT_MAX(t)                     slap_daemon[t].sd_nfds
 
 /* If a Listener address is provided, store that as the epoll data.
  * Otherwise, store the address of this socket's slot in the
  * index array. If we can't do this add, the system is out of
  * resources and we need to shutdown.
  */
-# define SLAP_ADD_SOCK(s, l) do { \
+# define SLAP_SOCK_ADD(t, s, l)                do { \
        int rc; \
-       SLAP_SOCK_IX((s)) = slap_daemon.sd_nfds; \
-       SLAP_SOCK_EP((s)).data.ptr = (l) ? (l) : (void *)(&SLAP_SOCK_IX(s)); \
-       SLAP_SOCK_EV((s)) = EPOLLIN; \
-       rc = epoll_ctl(slap_daemon.sd_epfd, EPOLL_CTL_ADD, \
-               (s), &SLAP_SOCK_EP((s))); \
+       SLAP_EPOLL_SOCK_IX(t,(s)) = slap_daemon[t].sd_nfds; \
+       SLAP_EPOLL_SOCK_EP(t,(s)).data.ptr = (l) ? (l) : (void *)(&SLAP_EPOLL_SOCK_IX(t,s)); \
+       SLAP_EPOLL_SOCK_EV(t,(s)) = EPOLLIN; \
+       rc = epoll_ctl(slap_daemon[t].sd_epfd, EPOLL_CTL_ADD, \
+               (s), &SLAP_EPOLL_SOCK_EP(t,(s))); \
        if ( rc == 0 ) { \
-               slap_daemon.sd_nfds++; \
+               slap_daemon[t].sd_nfds++; \
        } else { \
                Debug( LDAP_DEBUG_ANY, \
                        "daemon: epoll_ctl(ADD,fd=%d) failed, errno=%d, shutting down\n", \
@@ -196,138 +241,424 @@ static struct slap_daemon {
        } \
 } while (0)
 
-# define SLAP_EV_LISTENER(ptr) (((int *)(ptr) >= slap_daemon.sd_index && \
-       (int *)(ptr) <= (slap_daemon.sd_index+dtblsize)) ? 0 : 1 )
+# define SLAP_EPOLL_EV_LISTENER(t,ptr) \
+       (((int *)(ptr) >= slap_daemon[t].sd_index && \
+       (int *)(ptr) <= &slap_daemon[t].sd_index[dtblsize]) ? 0 : 1 )
 
-# define SLAP_EV_PTRFD(ptr) (SLAP_EV_LISTENER(ptr) ? \
-       ((Listener *)ptr)->sl_sd : (int *)(ptr) - slap_daemon.sd_index)
+# define SLAP_EPOLL_EV_PTRFD(t,ptr)            (SLAP_EPOLL_EV_LISTENER(t,ptr) ? \
+       ((Listener *)ptr)->sl_sd : \
+       (ber_socket_t) ((int *)(ptr) - slap_daemon[t].sd_index))
 
-# define SLAP_DEL_SOCK(s) do { \
-       int fd, rc, index = SLAP_SOCK_IX((s)); \
+# define SLAP_SOCK_DEL(t,s)            do { \
+       int fd, rc, index = SLAP_EPOLL_SOCK_IX(t,(s)); \
        if ( index < 0 ) break; \
-       rc = epoll_ctl(slap_daemon.sd_epfd, EPOLL_CTL_DEL, \
-               (s), &SLAP_SOCK_EP((s))); \
-       slap_daemon.sd_epolls[index] = \
-               slap_daemon.sd_epolls[slap_daemon.sd_nfds-1]; \
-       fd = SLAP_EV_PTRFD(slap_daemon.sd_epolls[index].data.ptr); \
-       slap_daemon.sd_index[fd] = index; \
-       slap_daemon.sd_index[(s)] = -1; \
-       slap_daemon.sd_nfds--; \
+       rc = epoll_ctl(slap_daemon[t].sd_epfd, EPOLL_CTL_DEL, \
+               (s), &SLAP_EPOLL_SOCK_EP(t,(s))); \
+       slap_daemon[t].sd_epolls[index] = \
+               slap_daemon[t].sd_epolls[slap_daemon[t].sd_nfds-1]; \
+       fd = SLAP_EPOLL_EV_PTRFD(t,slap_daemon[t].sd_epolls[index].data.ptr); \
+       slap_daemon[t].sd_index[fd] = index; \
+       slap_daemon[t].sd_index[(s)] = -1; \
+       slap_daemon[t].sd_nfds--; \
 } while (0)
 
-# define SLAP_EVENT_CLR_READ(i)        SLAP_CLR_EVENT((i), EPOLLIN)
-# define SLAP_EVENT_CLR_WRITE(i)       SLAP_CLR_EVENT((i), EPOLLOUT)
+# define SLAP_EVENT_CLR_READ(i)                SLAP_EPOLL_EVENT_CLR((i), EPOLLIN)
+# define SLAP_EVENT_CLR_WRITE(i)       SLAP_EPOLL_EVENT_CLR((i), EPOLLOUT)
 
-# define SLAP_CHK_EVENT(i, mode)       (revents[(i)].events & mode)
+# define SLAP_EPOLL_EVENT_CHK(i, mode) (revents[(i)].events & mode)
 
-# define SLAP_EVENT_IS_READ(i) SLAP_CHK_EVENT((i), EPOLLIN)
-# define SLAP_EVENT_IS_WRITE(i)        SLAP_CHK_EVENT((i), EPOLLOUT)
-# define SLAP_EVENT_IS_LISTENER(i)     SLAP_EV_LISTENER(revents[(i)].data.ptr)
-# define SLAP_EVENT_LISTENER(i)        ((Listener *)(revents[(i)].data.ptr))
+# define SLAP_EVENT_IS_READ(i)         SLAP_EPOLL_EVENT_CHK((i), EPOLLIN)
+# define SLAP_EVENT_IS_WRITE(i)                SLAP_EPOLL_EVENT_CHK((i), EPOLLOUT)
+# define SLAP_EVENT_IS_LISTENER(t,i)   SLAP_EPOLL_EV_LISTENER(t,revents[(i)].data.ptr)
+# define SLAP_EVENT_LISTENER(t,i)              ((Listener *)(revents[(i)].data.ptr))
 
-# define SLAP_EVENT_FD(i)      SLAP_EV_PTRFD(revents[(i)].data.ptr)
+# define SLAP_EVENT_FD(t,i)            SLAP_EPOLL_EV_PTRFD(t,revents[(i)].data.ptr)
 
-# define SLAP_SOCK_SET_INIT do { \
-       slap_daemon.sd_epolls = ch_calloc(1, \
-               sizeof(struct epoll_event) * dtblsize * 2); \
-       slap_daemon.sd_index = ch_malloc(sizeof(int) * dtblsize); \
-       slap_daemon.sd_epfd = epoll_create( dtblsize ); \
-       for (i=0; i<dtblsize; i++) slap_daemon.sd_index[i] = -1; \
+# define SLAP_SOCK_INIT(t)             do { \
+       int j; \
+       slap_daemon[t].sd_epolls = ch_calloc(1, \
+               ( sizeof(struct epoll_event) * 2 \
+                       + sizeof(int) ) * dtblsize * 2); \
+       slap_daemon[t].sd_index = (int *)&slap_daemon[t].sd_epolls[ 2 * dtblsize ]; \
+       slap_daemon[t].sd_epfd = epoll_create( dtblsize / slapd_daemon_threads ); \
+       for ( j = 0; j < dtblsize; j++ ) slap_daemon[t].sd_index[j] = -1; \
 } while (0)
 
-#define SLAP_SOCK_SET_DESTROY do { \
-       if ( slap_daemon.sd_epolls != NULL ) { \
-               ch_free( slap_daemon.sd_epolls ); \
-               slap_daemon.sd_epolls = NULL; \
-               ch_free( slap_daemon.sd_index ); \
-               slap_daemon.sd_index = NULL; \
-               close( slap_daemon.sd_epfd ); \
+# define SLAP_SOCK_DESTROY(t)          do { \
+       if ( slap_daemon[t].sd_epolls != NULL ) { \
+               ch_free( slap_daemon[t].sd_epolls ); \
+               slap_daemon[t].sd_epolls = NULL; \
+               slap_daemon[t].sd_index = NULL; \
+               close( slap_daemon[t].sd_epfd ); \
        } \
 } while ( 0 )
 
-# define SLAP_EVENT_DECL struct epoll_event *revents
+# define SLAP_EVENT_DECL               struct epoll_event *revents
+
+# define SLAP_EVENT_INIT(t)            do { \
+       revents = slap_daemon[t].sd_epolls + dtblsize; \
+} while (0)
 
-# define SLAP_EVENT_INIT do { \
-       revents = slap_daemon.sd_epolls + dtblsize; \
+# define SLAP_EVENT_WAIT(t, tvp, nsp)  do { \
+       *(nsp) = epoll_wait( slap_daemon[t].sd_epfd, revents, \
+               dtblsize, (tvp) ? (tvp)->tv_sec * 1000 : -1 ); \
 } while (0)
 
-# define SLAP_EVENT_WAIT(tvp) \
-       epoll_wait( slap_daemon.sd_epfd, revents, \
-               dtblsize, (tvp) ? (tvp)->tv_sec * 1000 : -1 )
+#elif defined(SLAP_X_DEVPOLL) && defined(HAVE_DEVPOLL)
 
-#else
-/* select */
+/*************************************************************
+ * Use Solaris' (>= 2.7) /dev/poll infrastructure - poll(7d) *
+ *************************************************************/
+# define SLAP_EVENT_FNAME              "/dev/poll"
+# define SLAP_EVENTS_ARE_INDEXED       0
+/*
+ * - sd_index  is used much like with epoll()
+ * - sd_l      is maintained as an array containing the address
+ *             of the listener; the index is the fd itself
+ * - sd_pollfd is used to keep track of what data has been
+ *             registered in /dev/poll
+ */
+# define SLAP_DEVPOLL_SOCK_IX(t,s)     (slap_daemon[t].sd_index[(s)])
+# define SLAP_DEVPOLL_SOCK_LX(t,s)     (slap_daemon[t].sd_l[(s)])
+# define SLAP_DEVPOLL_SOCK_EP(t,s)     (slap_daemon[t].sd_pollfd[SLAP_DEVPOLL_SOCK_IX(t,(s))])
+# define SLAP_DEVPOLL_SOCK_FD(t,s)     (SLAP_DEVPOLL_SOCK_EP(t,(s)).fd)
+# define SLAP_DEVPOLL_SOCK_EV(t,s)     (SLAP_DEVPOLL_SOCK_EP(t,(s)).events)
+# define SLAP_SOCK_IS_ACTIVE(t,s)              (SLAP_DEVPOLL_SOCK_IX(t,(s)) != -1)
+# define SLAP_SOCK_NOT_ACTIVE(t,s)     (SLAP_DEVPOLL_SOCK_IX(t,(s)) == -1)
+# define SLAP_SOCK_IS_SET(t,s, mode)   (SLAP_DEVPOLL_SOCK_EV(t,(s)) & (mode))
+
+# define SLAP_SOCK_IS_READ(t,s)                SLAP_SOCK_IS_SET(t,(s), POLLIN)
+# define SLAP_SOCK_IS_WRITE(t,s)               SLAP_SOCK_IS_SET(t,(s), POLLOUT)
+
+/* as far as I understand, any time we need to communicate with the kernel
+ * about the number and/or properties of a file descriptor we need it to
+ * wait for, we have to rewrite the whole set */
+# define SLAP_DEVPOLL_WRITE_POLLFD(t,s, pfd, n, what, shdn)    do { \
+       int rc; \
+       size_t size = (n) * sizeof( struct pollfd ); \
+       /* FIXME: use pwrite? */ \
+       rc = write( slap_daemon[t].sd_dpfd, (pfd), size ); \
+       if ( rc != size ) { \
+               Debug( LDAP_DEBUG_ANY, "daemon: " SLAP_EVENT_FNAME ": " \
+                       "%s fd=%d failed errno=%d\n", \
+                       (what), (s), errno ); \
+               if ( (shdn) ) { \
+                       slapd_shutdown = 2; \
+               } \
+       } \
+} while (0)
+
+# define SLAP_DEVPOLL_SOCK_SET(t,s, mode)      do { \
+       Debug( LDAP_DEBUG_CONNS, "SLAP_SOCK_SET_%s(%d)=%d\n", \
+               (mode) == POLLIN ? "READ" : "WRITE", (s), \
+               ( (SLAP_DEVPOLL_SOCK_EV(t,(s)) & (mode)) != (mode) ) ); \
+       if ( (SLAP_DEVPOLL_SOCK_EV(t,(s)) & (mode)) != (mode) ) { \
+               struct pollfd pfd; \
+               SLAP_DEVPOLL_SOCK_EV(t,(s)) |= (mode); \
+               pfd.fd = SLAP_DEVPOLL_SOCK_FD(t,(s)); \
+               pfd.events = /* (mode) */ SLAP_DEVPOLL_SOCK_EV(t,(s)); \
+               SLAP_DEVPOLL_WRITE_POLLFD(t,(s), &pfd, 1, "SET", 0); \
+       } \
+} while (0)
+
+# define SLAP_DEVPOLL_SOCK_CLR(t,s, mode)              do { \
+       Debug( LDAP_DEBUG_CONNS, "SLAP_SOCK_CLR_%s(%d)=%d\n", \
+               (mode) == POLLIN ? "READ" : "WRITE", (s), \
+               ( (SLAP_DEVPOLL_SOCK_EV(t,(s)) & (mode)) == (mode) ) ); \
+       if ((SLAP_DEVPOLL_SOCK_EV(t,(s)) & (mode)) == (mode) ) { \
+               struct pollfd pfd[2]; \
+               SLAP_DEVPOLL_SOCK_EV(t,(s)) &= ~(mode); \
+               pfd[0].fd = SLAP_DEVPOLL_SOCK_FD(t,(s)); \
+               pfd[0].events = POLLREMOVE; \
+               pfd[1] = SLAP_DEVPOLL_SOCK_EP(t,(s)); \
+               SLAP_DEVPOLL_WRITE_POLLFD(t,(s), &pfd[0], 2, "CLR", 0); \
+       } \
+} while (0)
+
+# define SLAP_SOCK_SET_READ(t,s)               SLAP_DEVPOLL_SOCK_SET(t,s, POLLIN)
+# define SLAP_SOCK_SET_WRITE(t,s)              SLAP_DEVPOLL_SOCK_SET(t,s, POLLOUT)
+
+# define SLAP_SOCK_CLR_READ(t,s)               SLAP_DEVPOLL_SOCK_CLR(t,(s), POLLIN)
+# define SLAP_SOCK_CLR_WRITE(t,s)              SLAP_DEVPOLL_SOCK_CLR(t,(s), POLLOUT)
+
+#  define SLAP_SOCK_SET_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_DEVPOLL_SOCK_IX(t,(s))] = 1 )
+#  define SLAP_SOCK_CLR_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_DEVPOLL_SOCK_IX(t,(s))] = 0 )
+#  define SLAP_SOCK_IS_SUSPEND(t,s) \
+       ( slap_daemon[t].sd_suspend[SLAP_DEVPOLL_SOCK_IX(t,(s))] == 1 )
+
+# define SLAP_DEVPOLL_EVENT_CLR(i, mode)       (revents[(i)].events &= ~(mode))
 
-# define SLAP_EVENTS_ARE_INDEXED 1
-# define SLAP_EVENT_DECL       \
-       fd_set readfds, writefds
+# define SLAP_EVENT_MAX(t)                     slap_daemon[t].sd_nfds
 
-# define SLAP_EVENT_INIT do { \
-       AC_MEMCPY( &readfds, &slap_daemon.sd_readers, sizeof(fd_set) ); \
+/* If a Listener address is provided, store that in the sd_l array.
+ * If we can't do this add, the system is out of resources and we 
+ * need to shutdown.
+ */
+# define SLAP_SOCK_ADD(t, s, l)                do { \
+       Debug( LDAP_DEBUG_CONNS, "SLAP_SOCK_ADD(%d, %p)\n", (s), (l), 0 ); \
+       SLAP_DEVPOLL_SOCK_IX(t,(s)) = slap_daemon[t].sd_nfds; \
+       SLAP_DEVPOLL_SOCK_LX(t,(s)) = (l); \
+       SLAP_DEVPOLL_SOCK_FD(t,(s)) = (s); \
+       SLAP_DEVPOLL_SOCK_EV(t,(s)) = POLLIN; \
+       SLAP_DEVPOLL_WRITE_POLLFD(t,(s), &SLAP_DEVPOLL_SOCK_EP((s)), 1, "ADD", 1); \
+       slap_daemon[t].sd_nfds++; \
+} while (0)
+
+# define SLAP_DEVPOLL_EV_LISTENER(ptr) ((ptr) != NULL)
+
+# define SLAP_SOCK_DEL(t,s)            do { \
+       int fd, index = SLAP_DEVPOLL_SOCK_IX(t,(s)); \
+       Debug( LDAP_DEBUG_CONNS, "SLAP_SOCK_DEL(%d)\n", (s), 0, 0 ); \
+       if ( index < 0 ) break; \
+       if ( index < slap_daemon[t].sd_nfds - 1 ) { \
+               struct pollfd pfd = slap_daemon[t].sd_pollfd[index]; \
+               fd = slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1].fd; \
+               slap_daemon[t].sd_pollfd[index] = slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1]; \
+               slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1] = pfd; \
+               slap_daemon[t].sd_index[fd] = index; \
+       } \
+       slap_daemon[t].sd_index[(s)] = -1; \
+       slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1].events = POLLREMOVE; \
+       SLAP_DEVPOLL_WRITE_POLLFD(t,(s), &slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1], 1, "DEL", 0); \
+       slap_daemon[t].sd_pollfd[slap_daemon[t].sd_nfds - 1].events = 0; \
+       slap_daemon[t].sd_nfds--; \
+} while (0)
+
+# define SLAP_EVENT_CLR_READ(i)                SLAP_DEVPOLL_EVENT_CLR((i), POLLIN)
+# define SLAP_EVENT_CLR_WRITE(i)       SLAP_DEVPOLL_EVENT_CLR((i), POLLOUT)
+
+# define SLAP_DEVPOLL_EVENT_CHK(i, mode)       (revents[(i)].events & (mode))
+
+# define SLAP_EVENT_FD(t,i)            (revents[(i)].fd)
+
+# define SLAP_EVENT_IS_READ(i)         SLAP_DEVPOLL_EVENT_CHK((i), POLLIN)
+# define SLAP_EVENT_IS_WRITE(i)                SLAP_DEVPOLL_EVENT_CHK((i), POLLOUT)
+# define SLAP_EVENT_IS_LISTENER(t,i)   SLAP_DEVPOLL_EV_LISTENER(SLAP_DEVPOLL_SOCK_LX(SLAP_EVENT_FD(t,(i))))
+# define SLAP_EVENT_LISTENER(t,i)              SLAP_DEVPOLL_SOCK_LX(SLAP_EVENT_FD(t,(i)))
+
+# define SLAP_SOCK_INIT(t)             do { \
+       slap_daemon[t].sd_pollfd = ch_calloc( 1, \
+               ( sizeof(struct pollfd) * 2 \
+                       + sizeof( int ) \
+                       + sizeof( Listener * ) ) * dtblsize ); \
+       slap_daemon[t].sd_index = (int *)&slap_daemon[t].sd_pollfd[ 2 * dtblsize ]; \
+       slap_daemon[t].sd_l = (Listener **)&slap_daemon[t].sd_index[ dtblsize ]; \
+       slap_daemon[t].sd_dpfd = open( SLAP_EVENT_FNAME, O_RDWR ); \
+       if ( slap_daemon[t].sd_dpfd == -1 ) { \
+               Debug( LDAP_DEBUG_ANY, "daemon: " SLAP_EVENT_FNAME ": " \
+                       "open(\"" SLAP_EVENT_FNAME "\") failed errno=%d\n", \
+                       errno, 0, 0 ); \
+               SLAP_SOCK_DESTROY; \
+               return -1; \
+       } \
+       for ( i = 0; i < dtblsize; i++ ) { \
+               slap_daemon[t].sd_pollfd[i].fd = -1; \
+               slap_daemon[t].sd_index[i] = -1; \
+       } \
+} while (0)
+
+# define SLAP_SOCK_DESTROY(t)          do { \
+       if ( slap_daemon[t].sd_pollfd != NULL ) { \
+               ch_free( slap_daemon[t].sd_pollfd ); \
+               slap_daemon[t].sd_pollfd = NULL; \
+               slap_daemon[t].sd_index = NULL; \
+               slap_daemon[t].sd_l = NULL; \
+               close( slap_daemon[t].sd_dpfd ); \
+       } \
+} while ( 0 )
+
+# define SLAP_EVENT_DECL               struct pollfd *revents
+
+# define SLAP_EVENT_INIT(t)            do { \
+       revents = &slap_daemon[t].sd_pollfd[ dtblsize ]; \
+} while (0)
+
+# define SLAP_EVENT_WAIT(t, tvp, nsp)  do { \
+       struct dvpoll           sd_dvpoll; \
+       sd_dvpoll.dp_timeout = (tvp) ? (tvp)->tv_sec * 1000 : -1; \
+       sd_dvpoll.dp_nfds = dtblsize; \
+       sd_dvpoll.dp_fds = revents; \
+       *(nsp) = ioctl( slap_daemon[t].sd_dpfd, DP_POLL, &sd_dvpoll ); \
+} while (0)
+
+#else /* ! epoll && ! /dev/poll */
+# ifdef HAVE_WINSOCK
+# define SLAP_EVENT_FNAME              "WSselect"
+/* Winsock provides a "select" function but its fd_sets are
+ * actually arrays of sockets. Since these sockets are handles
+ * and not a contiguous range of small integers, we manage our
+ * own "fd" table of socket handles and use their indices as
+ * descriptors.
+ *
+ * All of our listener/connection structures use fds; the actual
+ * I/O functions use sockets. The SLAP_FD2SOCK macro in proto-slap.h
+ * handles the mapping.
+ *
+ * Despite the mapping overhead, this is about 45% more efficient
+ * than just using Winsock's select and FD_ISSET directly.
+ *
+ * Unfortunately Winsock's select implementation doesn't scale well
+ * as the number of connections increases. This probably needs to be
+ * rewritten to use the Winsock overlapped/asynchronous I/O functions.
+ */
+# define SLAP_EVENTS_ARE_INDEXED       1
+# define SLAP_EVENT_DECL               fd_set readfds, writefds; char *rflags
+# define SLAP_EVENT_INIT(t)    do { \
+       int i; \
+       FD_ZERO( &readfds ); \
+       FD_ZERO( &writefds ); \
+       rflags = slap_daemon[t].sd_rflags; \
+       memset( rflags, 0, slap_daemon[t].sd_nfds ); \
+       for ( i=0; i<slap_daemon[t].sd_nfds; i++ ) { \
+               if ( slap_daemon[t].sd_flags[i] & SD_READ ) \
+                       FD_SET( slapd_ws_sockets[i], &readfds );\
+               if ( slap_daemon[t].sd_flags[i] & SD_WRITE ) \
+                       FD_SET( slapd_ws_sockets[i], &writefds ); \
+       } } while ( 0 )
+
+# define SLAP_EVENT_MAX(t)             slap_daemon[t].sd_nfds
+
+# define SLAP_EVENT_WAIT(t, tvp, nsp)  do { \
+       int i; \
+       *(nsp) = select( SLAP_EVENT_MAX(t), &readfds, \
+               nwriters > 0 ? &writefds : NULL, NULL, (tvp) ); \
+       for ( i=0; i<readfds.fd_count; i++) { \
+               int fd = slapd_sock2fd(readfds.fd_array[i]); \
+               if ( fd >= 0 ) { \
+                       slap_daemon[t].sd_rflags[fd] = SD_READ; \
+                       if ( fd >= *(nsp)) *(nsp) = fd+1; \
+               } \
+       } \
+       for ( i=0; i<writefds.fd_count; i++) { \
+               int fd = slapd_sock2fd(writefds.fd_array[i]); \
+               if ( fd >= 0 ) { \
+                       slap_daemon[t].sd_rflags[fd] = SD_WRITE; \
+                       if ( fd >= *(nsp)) *(nsp) = fd+1; \
+               } \
+       } \
+} while (0)
+
+# define SLAP_EVENT_IS_READ(fd)                (rflags[fd] & SD_READ)
+# define SLAP_EVENT_IS_WRITE(fd)       (rflags[fd] & SD_WRITE)
+
+# define SLAP_EVENT_CLR_READ(fd)       rflags[fd] &= ~SD_READ
+# define SLAP_EVENT_CLR_WRITE(fd)      rflags[fd] &= ~SD_WRITE
+
+# define SLAP_SOCK_INIT(t)             do { \
+       if (!t) { \
+       ldap_pvt_thread_mutex_init( &slapd_ws_mutex ); \
+       slapd_ws_sockets = ch_malloc( dtblsize * ( sizeof(SOCKET) + 2)); \
+       memset( slapd_ws_sockets, -1, dtblsize * sizeof(SOCKET) ); \
+       } \
+       slap_daemon[t].sd_flags = (char *)(slapd_ws_sockets + dtblsize); \
+       slap_daemon[t].sd_rflags = slap_daemon[t].sd_flags + dtblsize; \
+       memset( slap_daemon[t].sd_flags, 0, dtblsize ); \
+       slapd_ws_sockets[t*2] = wake_sds[t][0]; \
+       slapd_ws_sockets[t*2+1] = wake_sds[t][1]; \
+       wake_sds[t][0] = t*2; \
+       wake_sds[t][1] = t*2+1; \
+       slap_daemon[t].sd_nfds = t*2 + 2; \
+       } while ( 0 )
+
+# define SLAP_SOCK_DESTROY(t)  do { \
+       ch_free( slapd_ws_sockets ); slapd_ws_sockets = NULL; \
+       slap_daemon[t].sd_flags = NULL; \
+       slap_daemon[t].sd_rflags = NULL; \
+       ldap_pvt_thread_mutex_destroy( &slapd_ws_mutex ); \
+       } while ( 0 )
+
+# define SLAP_SOCK_IS_ACTIVE(t,fd) ( slap_daemon[t].sd_flags[fd] & SD_ACTIVE )
+# define SLAP_SOCK_IS_READ(t,fd) ( slap_daemon[t].sd_flags[fd] & SD_READ )
+# define SLAP_SOCK_IS_WRITE(t,fd) ( slap_daemon[t].sd_flags[fd] & SD_WRITE )
+# define SLAP_SOCK_NOT_ACTIVE(t,fd)    (!slap_daemon[t].sd_flags[fd])
+
+# define SLAP_SOCK_SET_READ(t,fd)              ( slap_daemon[t].sd_flags[fd] |= SD_READ )
+# define SLAP_SOCK_SET_WRITE(t,fd)             ( slap_daemon[t].sd_flags[fd] |= SD_WRITE )
+
+# define SLAP_SELECT_ADDTEST(t,s)      do { \
+       if ((s) >= slap_daemon[t].sd_nfds) slap_daemon[t].sd_nfds = (s)+1; \
+} while (0)
+
+# define SLAP_SOCK_CLR_READ(t,fd)              ( slap_daemon[t].sd_flags[fd] &= ~SD_READ )
+# define SLAP_SOCK_CLR_WRITE(t,fd)             ( slap_daemon[t].sd_flags[fd] &= ~SD_WRITE )
+
+# define SLAP_SOCK_ADD(t,s, l) do { \
+       SLAP_SELECT_ADDTEST(t,(s)); \
+       slap_daemon[t].sd_flags[s] = SD_ACTIVE|SD_READ; \
+} while ( 0 )
+
+# define SLAP_SOCK_DEL(t,s) do { \
+       slap_daemon[t].sd_flags[s] = 0; \
+       slapd_sockdel( s ); \
+} while ( 0 )
+
+# else /* !HAVE_WINSOCK */
+
+/**************************************
+ * Use select system call - select(2) *
+ **************************************/
+# define SLAP_EVENT_FNAME              "select"
+/* select */
+# define SLAP_EVENTS_ARE_INDEXED       1
+# define SLAP_EVENT_DECL               fd_set readfds, writefds
+
+# define SLAP_EVENT_INIT(t)            do { \
+       AC_MEMCPY( &readfds, &slap_daemon[t].sd_readers, sizeof(fd_set) );      \
        if ( nwriters ) { \
-               AC_MEMCPY( &writefds, &slap_daemon.sd_writers, sizeof(fd_set) ); \
+               AC_MEMCPY( &writefds, &slap_daemon[t].sd_writers, sizeof(fd_set) ); \
        } else { \
                FD_ZERO( &writefds ); \
        } \
 } while (0)
 
 # ifdef FD_SETSIZE
-#  define      CHK_SETSIZE do { \
+#  define SLAP_SELECT_CHK_SETSIZE      do { \
        if (dtblsize > FD_SETSIZE) dtblsize = FD_SETSIZE; \
 } while (0)
-# else
-#  define       CHK_SETSIZE do { ; } while (0)
-# endif
-
-# define       SLAP_SOCK_SET_INIT do { \
-       CHK_SETSIZE; \
-       FD_ZERO(&slap_daemon.sd_readers); \
-       FD_ZERO(&slap_daemon.sd_writers); \
+# else /* ! FD_SETSIZE */
+#  define SLAP_SELECT_CHK_SETSIZE      do { ; } while (0)
+# endif /* ! FD_SETSIZE */
+
+# define SLAP_SOCK_INIT(t)                     do { \
+       SLAP_SELECT_CHK_SETSIZE; \
+       FD_ZERO(&slap_daemon[t].sd_actives); \
+       FD_ZERO(&slap_daemon[t].sd_readers); \
+       FD_ZERO(&slap_daemon[t].sd_writers); \
 } while (0)
 
-#define                SLAP_SOCK_SET_DESTROY
+# define SLAP_SOCK_DESTROY(t)
 
-# define SLAP_SOCK_IS_ACTIVE(fd)       FD_ISSET((fd), &slap_daemon.sd_actives)
-# define SLAP_SOCK_IS_READ(fd)         FD_ISSET((fd), &slap_daemon.sd_readers)
-# define SLAP_SOCK_IS_WRITE(fd)                FD_ISSET((fd), &slap_daemon.sd_writers)
+# define SLAP_SOCK_IS_ACTIVE(t,fd)     FD_ISSET((fd), &slap_daemon[t].sd_actives)
+# define SLAP_SOCK_IS_READ(t,fd)               FD_ISSET((fd), &slap_daemon[t].sd_readers)
+# define SLAP_SOCK_IS_WRITE(t,fd)              FD_ISSET((fd), &slap_daemon[t].sd_writers)
 
-# define SLAP_SOCK_NOT_ACTIVE(fd)      (!SLAP_SOCK_IS_ACTIVE(fd) && \
-        !SLAP_SOCK_IS_READ(fd) && !SLAP_SOCK_IS_WRITE(fd))
+# define SLAP_SOCK_NOT_ACTIVE(t,fd)    (!SLAP_SOCK_IS_ACTIVE(t,fd) && \
+        !SLAP_SOCK_IS_READ(t,fd) && !SLAP_SOCK_IS_WRITE(t,fd))
 
-# ifdef HAVE_WINSOCK
-#  define SLAP_SOCK_SET_READ(fd)       do { \
-       if (!SLAP_SOCK_IS_READ(fd)) { FD_SET((fd), &slap_daemon.sd_readers); } \
-} while(0)
-#  define SLAP_SOCK_SET_WRITE(fd)      do { \
-       if (!SLAP_SOCK_IS_WRITE(fd)) { FD_SET((fd), &slap_daemon.sd_writers); } \
-} while(0)
-
-#  define SLAP_ADDTEST(s)      
-#  define SLAP_EVENT_MAX       dtblsize
-# else
-#  define SLAP_SOCK_SET_READ(fd)       FD_SET((fd), &slap_daemon.sd_readers)
-#  define SLAP_SOCK_SET_WRITE(fd)      FD_SET((fd), &slap_daemon.sd_writers)
-
-#  define SLAP_EVENT_MAX       slap_daemon.sd_nfds
-#  define SLAP_ADDTEST(s)      do { \
-       if ((s) >= slap_daemon.sd_nfds) slap_daemon.sd_nfds = (s)+1; \
+# define SLAP_SOCK_SET_READ(t,fd)      FD_SET((fd), &slap_daemon[t].sd_readers)
+# define SLAP_SOCK_SET_WRITE(t,fd)     FD_SET((fd), &slap_daemon[t].sd_writers)
+
+# define SLAP_EVENT_MAX(t)             slap_daemon[t].sd_nfds
+# define SLAP_SELECT_ADDTEST(t,s)      do { \
+       if ((s) >= slap_daemon[t].sd_nfds) slap_daemon[t].sd_nfds = (s)+1; \
 } while (0)
-# endif
 
-# define SLAP_SOCK_CLR_READ(fd)                FD_CLR((fd), &slap_daemon.sd_readers)
-# define SLAP_SOCK_CLR_WRITE(fd)       FD_CLR((fd), &slap_daemon.sd_writers)
+# define SLAP_SOCK_CLR_READ(t,fd)              FD_CLR((fd), &slap_daemon[t].sd_readers)
+# define SLAP_SOCK_CLR_WRITE(t,fd)     FD_CLR((fd), &slap_daemon[t].sd_writers)
 
-# define SLAP_ADD_SOCK(s, l) do { \
-       SLAP_ADDTEST((s)); \
-       FD_SET((s), &slap_daemon.sd_actives); \
-       FD_SET((s), &slap_daemon.sd_readers); \
-} while(0)
+# define SLAP_SOCK_ADD(t,s, l)         do { \
+       SLAP_SELECT_ADDTEST(t,(s)); \
+       FD_SET((s), &slap_daemon[t].sd_actives); \
+       FD_SET((s), &slap_daemon[t].sd_readers); \
+} while (0)
 
-# define SLAP_DEL_SOCK(s) do { \
-       FD_CLR((s), &slap_daemon.sd_actives); \
-       FD_CLR((s), &slap_daemon.sd_readers); \
-       FD_CLR((s), &slap_daemon.sd_writers); \
-} while(0)
+# define SLAP_SOCK_DEL(t,s)            do { \
+       FD_CLR((s), &slap_daemon[t].sd_actives); \
+       FD_CLR((s), &slap_daemon[t].sd_readers); \
+       FD_CLR((s), &slap_daemon[t].sd_writers); \
+} while (0)
 
 # define SLAP_EVENT_IS_READ(fd)                FD_ISSET((fd), &readfds)
 # define SLAP_EVENT_IS_WRITE(fd)       FD_ISSET((fd), &writefds)
@@ -335,10 +666,12 @@ static struct slap_daemon {
 # define SLAP_EVENT_CLR_READ(fd)       FD_CLR((fd), &readfds)
 # define SLAP_EVENT_CLR_WRITE(fd)      FD_CLR((fd), &writefds)
 
-# define SLAP_EVENT_WAIT(tvp) \
-       select( SLAP_EVENT_MAX, &readfds, \
-               nwriters > 0 ? &writefds : NULL, NULL, (tvp) )
-#endif
+# define SLAP_EVENT_WAIT(t, tvp, nsp)  do { \
+       *(nsp) = select( SLAP_EVENT_MAX(t), &readfds, \
+               nwriters > 0 ? &writefds : NULL, NULL, (tvp) ); \
+} while (0)
+# endif /* !HAVE_WINSOCK */
+#endif /* ! epoll && ! /dev/poll */
 
 #ifdef HAVE_SLP
 /*
@@ -355,53 +688,46 @@ const char *slapd_slp_attrs = NULL;
 
 static SLPError slapd_slp_cookie;
 
-void slapd_slp_init( const char* urls ) {
+static void
+slapd_slp_init( const char* urls )
+{
        int i;
        SLPError err;
 
        slapd_srvurls = ldap_str2charray( urls, " " );
 
-       if( slapd_srvurls == NULL ) return;
+       if ( slapd_srvurls == NULL ) return;
 
        /* find and expand INADDR_ANY URLs */
-       for( i=0; slapd_srvurls[i] != NULL; i++ ) {
-               if( strcmp( slapd_srvurls[i], "ldap:///" ) == 0) {
-                       char *host = ldap_pvt_get_fqdn( NULL );
-                       if ( host != NULL ) {
-                               slapd_srvurls[i] = (char *) ch_realloc( slapd_srvurls[i],
-                                       strlen( host ) +
-                                       sizeof( LDAP_SRVTYPE_PREFIX ) );
-                               strcpy( lutil_strcopy(slapd_srvurls[i],
-                                       LDAP_SRVTYPE_PREFIX ), host );
-
-                               ch_free( host );
-                       }
-
-               } else if ( strcmp( slapd_srvurls[i], "ldaps:///" ) == 0) {
-                       char *host = ldap_pvt_get_fqdn( NULL );
-                       if ( host != NULL ) {
-                               slapd_srvurls[i] = (char *) ch_realloc( slapd_srvurls[i],
-                                       strlen( host ) +
-                                       sizeof( LDAPS_SRVTYPE_PREFIX ) );
-                               strcpy( lutil_strcopy(slapd_srvurls[i],
-                                       LDAPS_SRVTYPE_PREFIX ), host );
-
-                               ch_free( host );
-                       }
+       for ( i = 0; slapd_srvurls[i] != NULL; i++ ) {
+               if ( strcmp( slapd_srvurls[i], "ldap:///" ) == 0 ) {
+                       slapd_srvurls[i] = (char *) ch_realloc( slapd_srvurls[i],
+                               global_host_bv.bv_len +
+                               sizeof( LDAP_SRVTYPE_PREFIX ) );
+                       strcpy( lutil_strcopy(slapd_srvurls[i],
+                               LDAP_SRVTYPE_PREFIX ), global_host_bv.bv_val );
+               } else if ( strcmp( slapd_srvurls[i], "ldaps:///" ) == 0 ) {
+                       slapd_srvurls[i] = (char *) ch_realloc( slapd_srvurls[i],
+                               global_host_bv.bv_len +
+                               sizeof( LDAPS_SRVTYPE_PREFIX ) );
+                       strcpy( lutil_strcopy(slapd_srvurls[i],
+                               LDAPS_SRVTYPE_PREFIX ), global_host_bv.bv_val );
                }
        }
 
        /* open the SLP handle */
        err = SLPOpen( "en", 0, &slapd_hslp );
 
-       if (err != SLP_OK) {
+       if ( err != SLP_OK ) {
                Debug( LDAP_DEBUG_CONNS, "daemon: SLPOpen() failed with %ld\n",
                        (long)err, 0, 0 );
        }
 }
 
-void slapd_slp_deinit() {
-       if( slapd_srvurls == NULL ) return;
+static void
+slapd_slp_deinit( void )
+{
+       if ( slapd_srvurls == NULL ) return;
 
        ldap_charray_free( slapd_srvurls );
        slapd_srvurls = NULL;
@@ -410,37 +736,40 @@ void slapd_slp_deinit() {
        SLPClose( slapd_hslp );
 }
 
-void slapd_slp_regreport(
-       SLPHandle hslp,
-       SLPError errcode,
-       void* cookie )
+static void
+slapd_slp_regreport(
+       SLPHandle       hslp,
+       SLPError        errcode,
+       void            *cookie )
 {
        /* return the error code in the cookie */
        *(SLPError*)cookie = errcode; 
 }
 
-void slapd_slp_reg() {
+static void
+slapd_slp_reg()
+{
        int i;
        SLPError err;
 
-       if( slapd_srvurls == NULL ) return;
+       if ( slapd_srvurls == NULL ) return;
 
-       for( i=0; slapd_srvurls[i] != NULL; i++ ) {
-               if( strncmp( slapd_srvurls[i], LDAP_SRVTYPE_PREFIX,
+       for ( i = 0; slapd_srvurls[i] != NULL; i++ ) {
+               if ( strncmp( slapd_srvurls[i], LDAP_SRVTYPE_PREFIX,
                                sizeof( LDAP_SRVTYPE_PREFIX ) - 1 ) == 0 ||
-                   strncmp( slapd_srvurls[i], LDAPS_SRVTYPE_PREFIX,
+                       strncmp( slapd_srvurls[i], LDAPS_SRVTYPE_PREFIX,
                                sizeof( LDAPS_SRVTYPE_PREFIX ) - 1 ) == 0 )
                {
                        err = SLPReg( slapd_hslp,
                                slapd_srvurls[i],
                                SLP_LIFETIME_MAXIMUM,
                                "ldap",
-                                       (slapd_slp_attrs) ? slapd_slp_attrs : "",
-                                       SLP_TRUE,
+                               (slapd_slp_attrs) ? slapd_slp_attrs : "",
+                               SLP_TRUE,
                                slapd_slp_regreport,
-                                       &slapd_slp_cookie );
+                               &slapd_slp_cookie );
 
-                       if (err != SLP_OK || slapd_slp_cookie != SLP_OK) {
+                       if ( err != SLP_OK || slapd_slp_cookie != SLP_OK ) {
                                Debug( LDAP_DEBUG_CONNS,
                                        "daemon: SLPReg(%s) failed with %ld, cookie = %ld\n",
                                        slapd_srvurls[i], (long)err, (long)slapd_slp_cookie );
@@ -449,19 +778,21 @@ void slapd_slp_reg() {
        }
 }
 
-void slapd_slp_dereg() {
+static void
+slapd_slp_dereg( void )
+{
        int i;
        SLPError err;
 
-       if( slapd_srvurls == NULL ) return;
+       if ( slapd_srvurls == NULL ) return;
 
-       for( i=0; slapd_srvurls[i] != NULL; i++ ) {
+       for ( i = 0; slapd_srvurls[i] != NULL; i++ ) {
                err = SLPDereg( slapd_hslp,
                        slapd_srvurls[i],
                        slapd_slp_regreport,
-                               &slapd_slp_cookie );
+                       &slapd_slp_cookie );
                
-               if (err != SLP_OK || slapd_slp_cookie != SLP_OK) {
+               if ( err != SLP_OK || slapd_slp_cookie != SLP_OK ) {
                        Debug( LDAP_DEBUG_CONNS,
                                "daemon: SLPDereg(%s) failed with %ld, cookie = %ld\n",
                                slapd_srvurls[i], (long)err, (long)slapd_slp_cookie );
@@ -470,6 +801,42 @@ void slapd_slp_dereg() {
 }
 #endif /* HAVE_SLP */
 
+#ifdef HAVE_WINSOCK
+/* Manage the descriptor to socket table */
+ber_socket_t
+slapd_socknew( ber_socket_t s )
+{
+       ber_socket_t i;
+       ldap_pvt_thread_mutex_lock( &slapd_ws_mutex );
+       for ( i = 0; i < dtblsize && slapd_ws_sockets[i] != INVALID_SOCKET; i++ );
+       if ( i == dtblsize ) {
+               WSASetLastError( WSAEMFILE );
+       } else {
+               slapd_ws_sockets[i] = s;
+       }
+       ldap_pvt_thread_mutex_unlock( &slapd_ws_mutex );
+       return i;
+}
+
+void
+slapd_sockdel( ber_socket_t s )
+{
+       ldap_pvt_thread_mutex_lock( &slapd_ws_mutex );
+       slapd_ws_sockets[s] = INVALID_SOCKET;
+       ldap_pvt_thread_mutex_unlock( &slapd_ws_mutex );
+}
+
+ber_socket_t
+slapd_sock2fd( ber_socket_t s )
+{
+       ber_socket_t i;
+       for ( i=0; i<dtblsize && slapd_ws_sockets[i] != s; i++);
+       if ( i == dtblsize )
+               i = -1;
+       return i;
+}
+#endif
+
 /*
  * Add a descriptor to daemon control
  *
@@ -479,39 +846,32 @@ void slapd_slp_dereg() {
  * idletimeout. The underlying event handler may record the Listener
  * argument to differentiate Listener's from real sessions.
  */
-static void slapd_add(ber_socket_t s, int isactive, Listener *sl) {
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
-
-       assert( SLAP_SOCK_NOT_ACTIVE(s) );
-
-       if ( isactive ) slap_daemon.sd_nactives++;
+static void
+slapd_add( ber_socket_t s, int isactive, Listener *sl, int id )
+{
+       if (id < 0)
+               id = DAEMON_ID(s);
+       ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
 
-       SLAP_ADD_SOCK(s, sl);
+       assert( SLAP_SOCK_NOT_ACTIVE(id, s) );
 
-       Debug( LDAP_DEBUG_CONNS, "daemon: added %ldr\n",
-               (long) s, 0, 0 );
+       if ( isactive ) slap_daemon[id].sd_nactives++;
 
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
+       SLAP_SOCK_ADD(id, s, sl);
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
-       WAKE_LISTENER(1);
-#endif
-}
+       Debug( LDAP_DEBUG_CONNS, "daemon: added %ldr%s listener=%p\n",
+               (long) s, isactive ? " (active)" : "", (void *)sl );
 
-void slapd_sd_lock()
-{
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
-}
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
 
-void slapd_sd_unlock()
-{
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
+       WAKE_LISTENER(id,1);
 }
 
 /*
  * Remove the descriptor from daemon control
  */
-void slapd_remove(
+void
+slapd_remove(
        ber_socket_t s,
        Sockbuf *sb,
        int wasactive,
@@ -520,25 +880,26 @@ void slapd_remove(
 {
        int waswriter;
        int wasreader;
+       int id = DAEMON_ID(s);
 
        if ( !locked )
-               ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+               ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
 
-       assert( SLAP_SOCK_IS_ACTIVE( s ));
+       assert( SLAP_SOCK_IS_ACTIVE( id, s ));
 
-       if ( wasactive ) slap_daemon.sd_nactives--;
+       if ( wasactive ) slap_daemon[id].sd_nactives--;
 
-       waswriter = SLAP_SOCK_IS_WRITE(s);
-       wasreader = SLAP_SOCK_IS_READ(s);
+       waswriter = SLAP_SOCK_IS_WRITE(id, s);
+       wasreader = SLAP_SOCK_IS_READ(id, s);
 
        Debug( LDAP_DEBUG_CONNS, "daemon: removing %ld%s%s\n",
                (long) s,
                wasreader ? "r" : "",
                waswriter ? "w" : "" );
 
-       if ( waswriter ) slap_daemon.sd_nwriters--;
+       if ( waswriter ) slap_daemon[id].sd_nwriters--;
 
-       SLAP_DEL_SOCK(s);
+       SLAP_SOCK_DEL(id, s);
 
        if ( sb )
                ber_sockbuf_free(sb);
@@ -547,7 +908,7 @@ void slapd_remove(
         * the select() loop. Now that we're removing a session from our
         * control, we can try to resume a dropped listener to use.
         */
-       if ( emfile ) {
+       if ( emfile && listening ) {
                int i;
                for ( i = 0; slap_listeners[i] != NULL; i++ ) {
                        Listener *lr = slap_listeners[i];
@@ -557,6 +918,8 @@ void slapd_remove(
                        if ( lr->sl_mute ) {
                                lr->sl_mute = 0;
                                emfile--;
+                               if ( DAEMON_ID(lr->sl_sd) != id )
+                                       WAKE_LISTENER(DAEMON_ID(lr->sl_sd), wake);
                                break;
                        }
                }
@@ -565,69 +928,119 @@ void slapd_remove(
                 */
                if ( slap_listeners[i] == NULL ) emfile = 0;
        }
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-       WAKE_LISTENER(wake || slapd_gentle_shutdown == 2);
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
+       WAKE_LISTENER(id, wake || slapd_gentle_shutdown == 2);
 }
 
-void slapd_clr_write(ber_socket_t s, int wake) {
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+void
+slapd_clr_write( ber_socket_t s, int wake )
+{
+       int id = DAEMON_ID(s);
+       ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
 
-       assert( SLAP_SOCK_IS_ACTIVE( s ));
+       if ( SLAP_SOCK_IS_WRITE( id, s )) {
+               assert( SLAP_SOCK_IS_ACTIVE( id, s ));
 
-       if ( SLAP_SOCK_IS_WRITE( s )) {
-               SLAP_SOCK_CLR_WRITE( s );
-               slap_daemon.sd_nwriters--;
+               SLAP_SOCK_CLR_WRITE( id, s );
+               slap_daemon[id].sd_nwriters--;
        }
 
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-       WAKE_LISTENER(wake);
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
+       WAKE_LISTENER(id,wake);
 }
 
-void slapd_set_write(ber_socket_t s, int wake) {
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+void
+slapd_set_write( ber_socket_t s, int wake )
+{
+       int id = DAEMON_ID(s);
+       ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
 
-       assert( SLAP_SOCK_IS_ACTIVE( s ));
+       assert( SLAP_SOCK_IS_ACTIVE( id, s ));
 
-       if ( !SLAP_SOCK_IS_WRITE( s )) {
-               SLAP_SOCK_SET_WRITE( s );
-               slap_daemon.sd_nwriters++;
+       if ( !SLAP_SOCK_IS_WRITE( id, s )) {
+               SLAP_SOCK_SET_WRITE( id, s );
+               slap_daemon[id].sd_nwriters++;
+       }
+       if (( wake & 2 ) && global_writetimeout && !chk_writetime ) {
+               if (id)
+                       ldap_pvt_thread_mutex_lock( &slap_daemon[0].sd_mutex );
+               if (!chk_writetime)
+                       chk_writetime = slap_get_time();
+               if (id)
+                       ldap_pvt_thread_mutex_unlock( &slap_daemon[0].sd_mutex );
        }
 
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-       WAKE_LISTENER(wake);
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
+       WAKE_LISTENER(id,wake);
 }
 
-int slapd_clr_read(ber_socket_t s, int wake) {
+int
+slapd_clr_read( ber_socket_t s, int wake )
+{
        int rc = 1;
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+       int id = DAEMON_ID(s);
+       ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
 
-       if ( SLAP_SOCK_IS_ACTIVE( s )) {
-               SLAP_SOCK_CLR_READ( s );
+       if ( SLAP_SOCK_IS_ACTIVE( id, s )) {
+               SLAP_SOCK_CLR_READ( id, s );
                rc = 0;
        }
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
        if ( !rc )
-               WAKE_LISTENER(wake);
+               WAKE_LISTENER(id,wake);
        return rc;
 }
 
-void slapd_set_read(ber_socket_t s, int wake) {
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+void
+slapd_set_read( ber_socket_t s, int wake )
+{
+       int do_wake = 1;
+       int id = DAEMON_ID(s);
+       ldap_pvt_thread_mutex_lock( &slap_daemon[id].sd_mutex );
+
+       if( SLAP_SOCK_IS_ACTIVE( id, s ) && !SLAP_SOCK_IS_READ( id, s )) {
+               SLAP_SOCK_SET_READ( id, s );
+       } else {
+               do_wake = 0;
+       }
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[id].sd_mutex );
+       if ( do_wake )
+               WAKE_LISTENER(id,wake);
+}
 
-       assert( SLAP_SOCK_IS_ACTIVE( s ));
-       if (!SLAP_SOCK_IS_READ( s )) SLAP_SOCK_SET_READ( s );
+time_t
+slapd_get_writetime()
+{
+       time_t cur;
+       ldap_pvt_thread_mutex_lock( &slap_daemon[0].sd_mutex );
+       cur = chk_writetime;
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[0].sd_mutex );
+       return cur;
+}
 
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-       WAKE_LISTENER(wake);
+void
+slapd_clr_writetime( time_t old )
+{
+       ldap_pvt_thread_mutex_lock( &slap_daemon[0].sd_mutex );
+       if ( chk_writetime == old )
+               chk_writetime = 0;
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[0].sd_mutex );
 }
 
-static void slapd_close(ber_socket_t s) {
+static void
+slapd_close( ber_socket_t s )
+{
        Debug( LDAP_DEBUG_CONNS, "daemon: closing %ld\n",
                (long) s, 0, 0 );
-       tcp_close(s);
+       tcp_close( SLAP_FD2SOCK(s) );
+#ifdef HAVE_WINSOCK
+       slapd_sockdel( s );
+#endif
 }
 
-static void slap_free_listener_addresses(struct sockaddr **sal) {
+static void
+slap_free_listener_addresses( struct sockaddr **sal )
+{
        struct sockaddr **sap;
        if (sal == NULL) return;
        for (sap = sal; *sap != NULL; sap++) ch_free(*sap);
@@ -635,7 +1048,8 @@ static void slap_free_listener_addresses(struct sockaddr **sal) {
 }
 
 #if defined(LDAP_PF_LOCAL) || defined(SLAP_X_LISTENER_MOD)
-static int get_url_perms(
+static int
+get_url_perms(
        char    **exts,
        mode_t  *perms,
        int     *crit )
@@ -688,7 +1102,7 @@ static int get_url_perms(
                                                S_IRGRP, S_IWGRP, S_IXGRP,
                                                S_IROTH, S_IWOTH, S_IXOTH
                                        };
-                                       static char     c[] = "-rwxrwxrwx"; 
+                                       static const char       c[] = "-rwxrwxrwx"; 
 
                                        if ( value[ j ] == c[ j ] ) {
                                                p |= m[ j ];
@@ -715,10 +1129,11 @@ static int get_url_perms(
 #endif /* LDAP_PF_LOCAL || SLAP_X_LISTENER_MOD */
 
 /* port = 0 indicates AF_LOCAL */
-static int slap_get_listener_addresses(
+static int
+slap_get_listener_addresses(
        const char *host,
        unsigned short port,
-       struct sockaddr ***sal)
+       struct sockaddr ***sal )
 {
        struct sockaddr **sap;
 
@@ -745,7 +1160,7 @@ static int slap_get_listener_addresses(
                (*sap)->sa_family = AF_LOCAL;
                strcpy( ((struct sockaddr_un *)*sap)->sun_path, host );
        } else
-#endif
+#endif /* LDAP_PF_LOCAL */
        {
 #ifdef HAVE_GETADDRINFO
                struct addrinfo hints, *res, *sai;
@@ -793,7 +1208,7 @@ static int slap_get_listener_addresses(
                                *(struct sockaddr_in6 *)*sap =
                                        *((struct sockaddr_in6 *)sai->ai_addr);
                                break;
-#  endif
+#  endif /* LDAP_PF_INET6 */
                        case AF_INET:
                                *sap = ch_malloc(sizeof(struct sockaddr_in));
                                if (*sap == NULL) {
@@ -817,7 +1232,7 @@ static int slap_get_listener_addresses(
 
                freeaddrinfo(res);
 
-#else
+#else /* ! HAVE_GETADDRINFO */
                int i, n = 1;
                struct in_addr in;
                struct hostent *he = NULL;
@@ -851,7 +1266,7 @@ static int slap_get_listener_addresses(
                                sizeof(struct in_addr) );
                }
                sap[i] = NULL;
-#endif
+#endif /* ! HAVE_GETADDRINFO */
        }
 
        return 0;
@@ -861,11 +1276,11 @@ errexit:
        return -1;
 }
 
-static int slap_open_listener(
+static int
+slap_open_listener(
        const char* url,
        int *listeners,
-       int *cur
-       )
+       int *cur )
 {
        int     num, tmp, rc;
        Listener l;
@@ -875,6 +1290,7 @@ static int slap_open_listener(
        int err, addrlen = 0;
        struct sockaddr **sal, **psal;
        int socktype = SOCK_STREAM;     /* default to COTS */
+       ber_socket_t s;
 
 #if defined(LDAP_PF_LOCAL) || defined(SLAP_X_LISTENER_MOD)
        /*
@@ -894,9 +1310,7 @@ static int slap_open_listener(
 
        l.sl_url.bv_val = NULL;
        l.sl_mute = 0;
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
        l.sl_busy = 0;
-#endif
 
 #ifndef HAVE_TLS
        if( ldap_pvt_url_scheme2tls( lud->lud_scheme ) ) {
@@ -908,13 +1322,18 @@ static int slap_open_listener(
 
        if(! lud->lud_port ) lud->lud_port = LDAP_PORT;
 
-#else
+#else /* HAVE_TLS */
        l.sl_is_tls = ldap_pvt_url_scheme2tls( lud->lud_scheme );
 
        if(! lud->lud_port ) {
                lud->lud_port = l.sl_is_tls ? LDAPS_PORT : LDAP_PORT;
        }
-#endif
+#endif /* HAVE_TLS */
+
+#ifdef LDAP_TCP_BUFFER
+       l.sl_tcp_rmem = 0;
+       l.sl_tcp_wmem = 0;
+#endif /* LDAP_TCP_BUFFER */
 
        port = (unsigned short) lud->lud_port;
 
@@ -926,13 +1345,13 @@ static int slap_open_listener(
                } else {
                        err = slap_get_listener_addresses(lud->lud_host, 0, &sal);
                }
-#else
+#else /* ! LDAP_PF_LOCAL */
 
                Debug( LDAP_DEBUG_ANY, "daemon: URL scheme not supported: %s",
                        url, 0, 0);
                ldap_free_urldesc( lud );
                return -1;
-#endif
+#endif /* ! LDAP_PF_LOCAL */
        } else {
                if( lud->lud_host == NULL || lud->lud_host[0] == '\0'
                        || strcmp(lud->lud_host, "*") == 0 )
@@ -945,7 +1364,7 @@ static int slap_open_listener(
 
 #ifdef LDAP_CONNECTIONLESS
        l.sl_is_udp = ( tmp == LDAP_PROTO_UDP );
-#endif
+#endif /* LDAP_CONNECTIONLESS */
 
 #if defined(LDAP_PF_LOCAL) || defined(SLAP_X_LISTENER_MOD)
        if ( lud->lud_exts ) {
@@ -979,12 +1398,12 @@ static int slap_open_listener(
                case AF_INET6:
                        af = "IPv6";
                        break;
-#endif
+#endif /* LDAP_PF_INET6 */
 #ifdef LDAP_PF_LOCAL
                case AF_LOCAL:
                        af = "Local";
                        break;
-#endif
+#endif /* LDAP_PF_LOCAL */
                default:
                        sal++;
                        continue;
@@ -992,10 +1411,10 @@ static int slap_open_listener(
 
 #ifdef LDAP_CONNECTIONLESS
                if( l.sl_is_udp ) socktype = SOCK_DGRAM;
-#endif
+#endif /* LDAP_CONNECTIONLESS */
 
-               l.sl_sd = socket( (*sal)->sa_family, socktype, 0);
-               if ( l.sl_sd == AC_SOCKET_INVALID ) {
+               s = socket( (*sal)->sa_family, socktype, 0);
+               if ( s == AC_SOCKET_INVALID ) {
                        int err = sock_errno();
                        Debug( LDAP_DEBUG_ANY,
                                "daemon: %s socket() failed errno=%d (%s)\n",
@@ -1003,28 +1422,27 @@ static int slap_open_listener(
                        sal++;
                        continue;
                }
+               l.sl_sd = SLAP_SOCKNEW( s );
 
-#ifndef HAVE_WINSOCK
                if ( l.sl_sd >= dtblsize ) {
                        Debug( LDAP_DEBUG_ANY,
                                "daemon: listener descriptor %ld is too great %ld\n",
                                (long) l.sl_sd, (long) dtblsize, 0 );
-                       tcp_close( l.sl_sd );
+                       tcp_close( s );
                        sal++;
                        continue;
                }
-#endif
 
 #ifdef LDAP_PF_LOCAL
                if ( (*sal)->sa_family == AF_LOCAL ) {
                        unlink( ((struct sockaddr_un *)*sal)->sun_path );
                } else
-#endif
+#endif /* LDAP_PF_LOCAL */
                {
 #ifdef SO_REUSEADDR
                        /* enable address reuse */
                        tmp = 1;
-                       rc = setsockopt( l.sl_sd, SOL_SOCKET, SO_REUSEADDR,
+                       rc = setsockopt( s, SOL_SOCKET, SO_REUSEADDR,
                                (char *) &tmp, sizeof(tmp) );
                        if ( rc == AC_SOCKET_ERROR ) {
                                int err = sock_errno();
@@ -1032,7 +1450,7 @@ static int slap_open_listener(
                                        "setsockopt(SO_REUSEADDR) failed errno=%d (%s)\n",
                                        (long) l.sl_sd, err, sock_errstr(err) );
                        }
-#endif
+#endif /* SO_REUSEADDR */
                }
 
                switch( (*sal)->sa_family ) {
@@ -1044,7 +1462,7 @@ static int slap_open_listener(
 #ifdef IPV6_V6ONLY
                        /* Try to use IPv6 sockets for IPv6 only */
                        tmp = 1;
-                       rc = setsockopt( l.sl_sd, IPPROTO_IPV6, IPV6_V6ONLY,
+                       rc = setsockopt( , IPPROTO_IPV6, IPV6_V6ONLY,
                                (char *) &tmp, sizeof(tmp) );
                        if ( rc == AC_SOCKET_ERROR ) {
                                int err = sock_errno();
@@ -1052,30 +1470,53 @@ static int slap_open_listener(
                                        "setsockopt(IPV6_V6ONLY) failed errno=%d (%s)\n",
                                        (long) l.sl_sd, err, sock_errstr(err) );
                        }
-#endif
+#endif /* IPV6_V6ONLY */
                        addrlen = sizeof(struct sockaddr_in6);
                        break;
-#endif
+#endif /* LDAP_PF_INET6 */
 
 #ifdef LDAP_PF_LOCAL
                case AF_LOCAL:
 #ifdef LOCAL_CREDS
-               {
-                       int one = 1;
-                       setsockopt(l.sl_sd, 0, LOCAL_CREDS, &one, sizeof one);
-               }
-#endif
-               addrlen = sizeof(struct sockaddr_un);
-               break;
-#endif
+                       {
+                               int one = 1;
+                               setsockopt( s, 0, LOCAL_CREDS, &one, sizeof( one ) );
+                       }
+#endif /* LOCAL_CREDS */
+
+                       addrlen = sizeof( struct sockaddr_un );
+                       break;
+#endif /* LDAP_PF_LOCAL */
                }
 
-               if (bind(l.sl_sd, *sal, addrlen)) {
+#ifdef LDAP_PF_LOCAL
+               /* create socket with all permissions set for those systems
+                * that honor permissions on sockets (e.g. Linux); typically,
+                * only write is required.  To exploit filesystem permissions,
+                * place the socket in a directory and use directory's
+                * permissions.  Need write perms to the directory to 
+                * create/unlink the socket; likely need exec perms to access
+                * the socket (ITS#4709) */
+               {
+                       mode_t old_umask = 0;
+
+                       if ( (*sal)->sa_family == AF_LOCAL ) {
+                               old_umask = umask( 0 );
+                       }
+#endif /* LDAP_PF_LOCAL */
+                       rc = bind( s, *sal, addrlen );
+#ifdef LDAP_PF_LOCAL
+                       if ( old_umask != 0 ) {
+                               umask( old_umask );
+                       }
+               }
+#endif /* LDAP_PF_LOCAL */
+               if ( rc ) {
                        err = sock_errno();
                        Debug( LDAP_DEBUG_ANY,
                                "daemon: bind(%ld) failed errno=%d (%s)\n",
-                               (long) l.sl_sd, err, sock_errstr(err) );
-                       tcp_close( l.sl_sd );
+                               (long)l.sl_sd, err, sock_errstr( err ) );
+                       tcp_close( s );
                        sal++;
                        continue;
                }
@@ -1098,9 +1539,9 @@ static int slap_open_listener(
                        inet_ntop( AF_INET, &((struct sockaddr_in *)*sal)->sin_addr,
                                addr, sizeof(addr) );
                        s = addr;
-#else
+#else /* ! HAVE_GETADDRINFO || ! HAVE_INET_NTOP */
                        s = inet_ntoa( ((struct sockaddr_in *) *sal)->sin_addr );
-#endif
+#endif /* ! HAVE_GETADDRINFO || ! HAVE_INET_NTOP */
                        port = ntohs( ((struct sockaddr_in *)*sal) ->sin_port );
                        l.sl_name.bv_val =
                                ber_memalloc( sizeof("IP=255.255.255.255:65535") );
@@ -1116,9 +1557,9 @@ static int slap_open_listener(
                        inet_ntop( AF_INET6, &((struct sockaddr_in6 *)*sal)->sin6_addr,
                                addr, sizeof addr);
                        port = ntohs( ((struct sockaddr_in6 *)*sal)->sin6_port );
-                       l.sl_name.bv_len = strlen(addr) + sizeof("IP= 65535");
+                       l.sl_name.bv_len = strlen(addr) + sizeof("IP=[]:65535");
                        l.sl_name.bv_val = ber_memalloc( l.sl_name.bv_len );
-                       snprintf( l.sl_name.bv_val, l.sl_name.bv_len, "IP=%s %d", 
+                       snprintf( l.sl_name.bv_val, l.sl_name.bv_len, "IP=[%s]:%d", 
                                addr, port );
                        l.sl_name.bv_len = strlen( l.sl_name.bv_val );
                } break;
@@ -1155,7 +1596,10 @@ static int slap_open_listener(
 static int sockinit(void);
 static int sockdestroy(void);
 
-int slapd_daemon_init( const char *urls )
+static int daemon_inited = 0;
+
+int
+slapd_daemon_init( const char *urls )
 {
        int i, j, n, rc;
        char **u;
@@ -1163,33 +1607,41 @@ int slapd_daemon_init( const char *urls )
        Debug( LDAP_DEBUG_ARGS, "daemon_init: %s\n",
                urls ? urls : "<null>", 0, 0 );
 
-       ldap_pvt_thread_mutex_init( &slap_daemon.sd_mutex );
+       for ( i=0; i<MAX_DAEMON_THREADS; i++ ) {
+               wake_sds[i][0] = AC_SOCKET_INVALID;
+               wake_sds[i][1] = AC_SOCKET_INVALID;
+       }
+
+       ldap_pvt_thread_mutex_init( &slap_daemon[0].sd_mutex );
 #ifdef HAVE_TCPD
-       ldap_pvt_thread_mutex_init( &slap_daemon.tcpd_mutex );
-#endif
+       ldap_pvt_thread_mutex_init( &sd_tcpd_mutex );
+#endif /* TCP Wrappers */
+
+       daemon_inited = 1;
 
        if( (rc = sockinit()) != 0 ) return rc;
 
 #ifdef HAVE_SYSCONF
        dtblsize = sysconf( _SC_OPEN_MAX );
-#elif HAVE_GETDTABLESIZE
+#elif defined(HAVE_GETDTABLESIZE)
        dtblsize = getdtablesize();
-#else
+#else /* ! HAVE_SYSCONF && ! HAVE_GETDTABLESIZE */
        dtblsize = FD_SETSIZE;
-#endif
+#endif /* ! HAVE_SYSCONF && ! HAVE_GETDTABLESIZE */
 
        /* open a pipe (or something equivalent connected to itself).
         * we write a byte on this fd whenever we catch a signal. The main
         * loop will be select'ing on this socket, and will wake up when
         * this byte arrives.
         */
-       if( (rc = lutil_pair( wake_sds )) < 0 ) {
+       if( (rc = lutil_pair( wake_sds[0] )) < 0 ) {
                Debug( LDAP_DEBUG_ANY,
                        "daemon: lutil_pair() failed rc=%d\n", rc, 0, 0 );
                return rc;
        }
+       ber_pvt_socket_set_nonblock( wake_sds[0][1], 1 );
 
-       SLAP_SOCK_SET_INIT;
+       SLAP_SOCK_INIT(0);
 
        if( urls == NULL ) urls = "ldap:///";
 
@@ -1236,7 +1688,7 @@ int slapd_daemon_init( const char *urls )
                slapd_slp_init( urls );
                slapd_slp_reg();
        }
-#endif
+#endif /* HAVE_SLP */
 
        ldap_charray_free( u );
 
@@ -1245,11 +1697,30 @@ int slapd_daemon_init( const char *urls )
 
 
 int
-slapd_daemon_destroy(void)
+slapd_daemon_destroy( void )
 {
        connections_destroy();
-       tcp_close( wake_sds[1] );
-       tcp_close( wake_sds[0] );
+       if ( daemon_inited ) {
+               int i;
+
+               for ( i=0; i<slapd_daemon_threads; i++ ) {
+#ifdef HAVE_WINSOCK
+                       if ( wake_sds[i][1] != INVALID_SOCKET &&
+                               SLAP_FD2SOCK( wake_sds[i][1] ) != SLAP_FD2SOCK( wake_sds[i][0] ))
+#endif /* HAVE_WINSOCK */
+                               tcp_close( SLAP_FD2SOCK(wake_sds[i][1]) );
+#ifdef HAVE_WINSOCK
+                       if ( wake_sds[i][0] != INVALID_SOCKET )
+#endif /* HAVE_WINSOCK */
+                               tcp_close( SLAP_FD2SOCK(wake_sds[i][0]) );
+                       ldap_pvt_thread_mutex_destroy( &slap_daemon[i].sd_mutex );
+                       SLAP_SOCK_DESTROY(i);
+               }
+               daemon_inited = 0;
+#ifdef HAVE_TCPD
+               ldap_pvt_thread_mutex_destroy( &sd_tcpd_mutex );
+#endif /* TCP Wrappers */
+       }
        sockdestroy();
 
 #ifdef HAVE_SLP
@@ -1257,13 +1728,8 @@ slapd_daemon_destroy(void)
                slapd_slp_dereg();
                slapd_slp_deinit();
        }
-#endif
-
-#ifdef HAVE_TCPD
-       ldap_pvt_thread_mutex_destroy( &slap_daemon.tcpd_mutex );
-#endif
+#endif /* HAVE_SLP */
 
-       ldap_pvt_thread_mutex_destroy( &slap_daemon.sd_mutex );
        return 0;
 }
 
@@ -1274,11 +1740,17 @@ close_listeners(
 {
        int l;
 
+       if ( !listening )
+               return;
+       listening = 0;
+
        for ( l = 0; slap_listeners[l] != NULL; l++ ) {
                Listener *lr = slap_listeners[l];
 
                if ( lr->sl_sd != AC_SOCKET_INVALID ) {
-                       if ( remove ) slapd_remove( lr->sl_sd, NULL, 0, 0, 0 );
+                       int s = lr->sl_sd;
+                       lr->sl_sd = AC_SOCKET_INVALID;
+                       if ( remove ) slapd_remove( s, NULL, 0, 0, 0 );
 
 #ifdef LDAP_PF_LOCAL
                        if ( lr->sl_sa.sa_addr.sa_family == AF_LOCAL ) {
@@ -1286,9 +1758,20 @@ close_listeners(
                        }
 #endif /* LDAP_PF_LOCAL */
 
-                       slapd_close( lr->sl_sd );
+                       slapd_close( s );
                }
+       }
+}
+
+static void
+destroy_listeners( void )
+{
+       Listener *lr, **ll = slap_listeners;
+
+       if ( ll == NULL )
+               return;
 
+       while ( (lr = *ll++) != NULL ) {
                if ( lr->sl_url.bv_val ) {
                        ber_memfree( lr->sl_url.bv_val );
                }
@@ -1298,8 +1781,10 @@ close_listeners(
                }
 
                free( lr );
-               slap_listeners[l] = NULL;
        }
+
+       free( slap_listeners );
+       slap_listeners = NULL;
 }
 
 static int
@@ -1308,30 +1793,40 @@ slap_listener(
 {
        Sockaddr                from;
 
-       ber_socket_t s;
-       socklen_t len = sizeof(from);
-       long id;
+       ber_socket_t s, sfd;
+       ber_socklen_t len = sizeof(from);
+       Connection *c;
        slap_ssf_t ssf = 0;
        struct berval authid = BER_BVNULL;
 #ifdef SLAPD_RLOOKUPS
        char hbuf[NI_MAXHOST];
-#endif
+#endif /* SLAPD_RLOOKUPS */
 
        char    *dnsname = NULL;
        char    *peeraddr = NULL;
 #ifdef LDAP_PF_LOCAL
        char peername[MAXPATHLEN + sizeof("PATH=")];
+#ifdef LDAP_PF_LOCAL_SENDMSG
+       char peerbuf[8];
+       struct berval peerbv = BER_BVNULL;
+#endif
 #elif defined(LDAP_PF_INET6)
-       char peername[sizeof("IP=ffff:ffff:ffff:ffff:ffff:ffff:ffff:ffff 65535")];
-#else
+       char peername[sizeof("IP=[ffff:ffff:ffff:ffff:ffff:ffff:ffff:ffff]:65535")];
+#else /* ! LDAP_PF_LOCAL && ! LDAP_PF_INET6 */
        char peername[sizeof("IP=255.255.255.255:65336")];
 #endif /* LDAP_PF_LOCAL */
+       int cflag;
+       int tid;
+
+       Debug( LDAP_DEBUG_TRACE,
+               ">>> slap_listener(%s)\n",
+               sl->sl_url.bv_val, 0, 0 );
 
        peername[0] = '\0';
 
 #ifdef LDAP_CONNECTIONLESS
        if ( sl->sl_is_udp ) return 1;
-#endif
+#endif /* LDAP_CONNECTIONLESS */
 
 #  ifdef LDAP_PF_LOCAL
        /* FIXME: apparently accept doesn't fill
@@ -1339,15 +1834,13 @@ slap_listener(
        from.sa_un_addr.sun_path[0] = '\0';
 #  endif /* LDAP_PF_LOCAL */
 
-       s = accept( sl->sl_sd, (struct sockaddr *) &from, &len );
+       s = accept( SLAP_FD2SOCK( sl->sl_sd ), (struct sockaddr *) &from, &len );
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
        /* Resume the listener FD to allow concurrent-processing of
         * additional incoming connections.
         */
        sl->sl_busy = 0;
-       WAKE_LISTENER(1);
-#endif
+       WAKE_LISTENER(DAEMON_ID(sl->sl_sd),1);
 
        if ( s == AC_SOCKET_INVALID ) {
                int err = sock_errno();
@@ -1355,17 +1848,17 @@ slap_listener(
                if(
 #ifdef EMFILE
                    err == EMFILE ||
-#endif
+#endif /* EMFILE */
 #ifdef ENFILE
                    err == ENFILE ||
-#endif
+#endif /* ENFILE */
                    0 )
                {
-                       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+                       ldap_pvt_thread_mutex_lock( &slap_daemon[0].sd_mutex );
                        emfile++;
                        /* Stop listening until an existing session closes */
                        sl->sl_mute = 1;
-                       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
+                       ldap_pvt_thread_mutex_unlock( &slap_daemon[0].sd_mutex );
                }
 
                Debug( LDAP_DEBUG_ANY,
@@ -1374,26 +1867,26 @@ slap_listener(
                ldap_pvt_thread_yield();
                return 0;
        }
+       sfd = SLAP_SOCKNEW( s );
 
-#ifndef HAVE_WINSOCK
        /* make sure descriptor number isn't too great */
-       if ( s >= dtblsize ) {
+       if ( sfd >= dtblsize ) {
                Debug( LDAP_DEBUG_ANY,
                        "daemon: %ld beyond descriptor table size %ld\n",
-                       (long) s, (long) dtblsize, 0 );
+                       (long) sfd, (long) dtblsize, 0 );
 
-               slapd_close(s);
+               tcp_close(s);
                ldap_pvt_thread_yield();
                return 0;
        }
-#endif
+       tid = DAEMON_ID(sfd);
 
 #ifdef LDAP_DEBUG
-       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+       ldap_pvt_thread_mutex_lock( &slap_daemon[tid].sd_mutex );
        /* newly accepted stream should not be in any of the FD SETS */
-       assert( SLAP_SOCK_NOT_ACTIVE( s ));
-       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-#endif
+       assert( SLAP_SOCK_NOT_ACTIVE( tid, sfd ));
+       ldap_pvt_thread_mutex_unlock( &slap_daemon[tid].sd_mutex );
+#endif /* LDAP_DEBUG */
 
 #if defined( SO_KEEPALIVE ) || defined( TCP_NODELAY )
 #ifdef LDAP_PF_LOCAL
@@ -1412,9 +1905,9 @@ slap_listener(
                        int err = sock_errno();
                        Debug( LDAP_DEBUG_ANY,
                                "slapd(%ld): setsockopt(SO_KEEPALIVE) failed "
-                               "errno=%d (%s)\n", (long) s, err, sock_errstr(err) );
+                               "errno=%d (%s)\n", (long) sfd, err, sock_errstr(err) );
                }
-#endif
+#endif /* SO_KEEPALIVE */
 #ifdef TCP_NODELAY
                /* enable no delay */
                tmp = 1;
@@ -1424,19 +1917,22 @@ slap_listener(
                        int err = sock_errno();
                        Debug( LDAP_DEBUG_ANY,
                                "slapd(%ld): setsockopt(TCP_NODELAY) failed "
-                               "errno=%d (%s)\n", (long) s, err, sock_errstr(err) );
+                               "errno=%d (%s)\n", (long) sfd, err, sock_errstr(err) );
                }
-#endif
+#endif /* TCP_NODELAY */
        }
-#endif
+#endif /* SO_KEEPALIVE || TCP_NODELAY */
 
        Debug( LDAP_DEBUG_CONNS,
                "daemon: listen=%ld, new connection on %ld\n",
-               (long) sl->sl_sd, (long) s, 0 );
+               (long) sl->sl_sd, (long) sfd, 0 );
 
+       cflag = 0;
        switch ( from.sa_addr.sa_family ) {
 #  ifdef LDAP_PF_LOCAL
        case AF_LOCAL:
+               cflag |= CONN_IS_IPC;
+
                /* FIXME: apparently accept doesn't fill
                 * the sun_path sun_path member */
                if ( from.sa_un_addr.sun_path[0] == '\0' ) {
@@ -1451,7 +1947,11 @@ slap_listener(
                        uid_t uid;
                        gid_t gid;
 
-                       if( getpeereid( s, &uid, &gid ) == 0 ) {
+#ifdef LDAP_PF_LOCAL_SENDMSG
+                       peerbv.bv_val = peerbuf;
+                       peerbv.bv_len = sizeof( peerbuf );
+#endif
+                       if( LUTIL_GETPEEREID( s, &uid, &gid, &peerbv ) == 0 ) {
                                authid.bv_val = ch_malloc(
                                        STRLENOF( "gidNumber=4294967295+uidNumber=4294967295,"
                                        "cn=peercred,cn=external,cn=auth" ) + 1 );
@@ -1482,7 +1982,7 @@ slap_listener(
                peeraddr = (char *) inet_ntop( AF_INET6,
                                      &from.sa_in6_addr.sin6_addr,
                                      addr, sizeof addr );
-               sprintf( peername, "IP=%s %d",
+               sprintf( peername, "IP=[%s]:%d",
                         peeraddr != NULL ? peeraddr : SLAP_STRING_UNKNOWN,
                         (unsigned) ntohs( from.sa_in6_addr.sin6_port ) );
        }
@@ -1490,21 +1990,21 @@ slap_listener(
 #  endif /* LDAP_PF_INET6 */
 
        case AF_INET:
-       peeraddr = inet_ntoa( from.sa_in_addr.sin_addr );
-       sprintf( peername, "IP=%s:%d",
-               peeraddr != NULL ? peeraddr : SLAP_STRING_UNKNOWN,
-               (unsigned) ntohs( from.sa_in_addr.sin_port ) );
+               peeraddr = inet_ntoa( from.sa_in_addr.sin_addr );
+               sprintf( peername, "IP=%s:%d",
+                       peeraddr != NULL ? peeraddr : SLAP_STRING_UNKNOWN,
+                       (unsigned) ntohs( from.sa_in_addr.sin_port ) );
                break;
 
        default:
-               slapd_close(s);
+               slapd_close(sfd);
                return 0;
        }
 
        if ( ( from.sa_addr.sa_family == AF_INET )
 #ifdef LDAP_PF_INET6
                || ( from.sa_addr.sa_family == AF_INET6 )
-#endif
+#endif /* LDAP_PF_INET6 */
                )
        {
                dnsname = NULL;
@@ -1522,69 +2022,68 @@ slap_listener(
 #ifdef HAVE_TCPD
                {
                        int rc;
-                       ldap_pvt_thread_mutex_lock( &slap_daemon.tcpd_mutex );
+                       ldap_pvt_thread_mutex_lock( &sd_tcpd_mutex );
                        rc = hosts_ctl("slapd",
                                dnsname != NULL ? dnsname : SLAP_STRING_UNKNOWN,
                                peeraddr != NULL ? peeraddr : SLAP_STRING_UNKNOWN,
                                SLAP_STRING_UNKNOWN );
-                       ldap_pvt_thread_mutex_unlock( &slap_daemon.tcpd_mutex );
+                       ldap_pvt_thread_mutex_unlock( &sd_tcpd_mutex );
                        if ( !rc ) {
                                /* DENY ACCESS */
                                Statslog( LDAP_DEBUG_STATS,
                                        "fd=%ld DENIED from %s (%s)\n",
-                                       (long) s,
+                                       (long) sfd,
                                        dnsname != NULL ? dnsname : SLAP_STRING_UNKNOWN,
                                        peeraddr != NULL ? peeraddr : SLAP_STRING_UNKNOWN,
                                        0, 0 );
-                               slapd_close(s);
+                               slapd_close(sfd);
                                return 0;
                        }
                }
 #endif /* HAVE_TCPD */
        }
 
-       id = connection_init(s, sl,
-               dnsname != NULL ? dnsname : SLAP_STRING_UNKNOWN,
-               peername,
 #ifdef HAVE_TLS
-               sl->sl_is_tls ? CONN_IS_TLS : 0,
-#else
-               0,
+       if ( sl->sl_is_tls ) cflag |= CONN_IS_TLS;
 #endif
-               ssf,
-               authid.bv_val ? &authid : NULL );
+       c = connection_init(sfd, sl,
+               dnsname != NULL ? dnsname : SLAP_STRING_UNKNOWN,
+               peername, cflag, ssf,
+               authid.bv_val ? &authid : NULL
+               LDAP_PF_LOCAL_SENDMSG_ARG(&peerbv));
 
        if( authid.bv_val ) ch_free(authid.bv_val);
 
-       if( id < 0 ) {
+       if( !c ) {
                Debug( LDAP_DEBUG_ANY,
                        "daemon: connection_init(%ld, %s, %s) failed.\n",
-                       (long) s, peername, sl->sl_name.bv_val );
-               slapd_close(s);
+                       (long) sfd, peername, sl->sl_name.bv_val );
+               slapd_close(sfd);
                return 0;
        }
 
        Statslog( LDAP_DEBUG_STATS,
                "conn=%ld fd=%ld ACCEPT from %s (%s)\n",
-               id, (long) s, peername, sl->sl_name.bv_val,
+               c->c_connid, (long) sfd, peername, sl->sl_name.bv_val,
                0 );
 
        return 0;
 }
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
 static void*
 slap_listener_thread(
        void* ctx,
        void* ptr )
 {
-       int rc;
+       int             rc;
+       Listener        *sl = (Listener *)ptr;
 
-       rc = slap_listener( (Listener*)ptr );
+       rc = slap_listener( sl );
 
        if( rc != LDAP_SUCCESS ) {
                Debug( LDAP_DEBUG_ANY,
-                       "listener_thread: failed %d", rc, 0, 0 );
+                       "slap_listener_thread(%s): failed err=%d",
+                       sl->sl_url.bv_val, rc, 0 );
        }
 
        return (void*)NULL;
@@ -1599,19 +2098,18 @@ slap_listener_activate(
        Debug( LDAP_DEBUG_TRACE, "slap_listener_activate(%d): %s\n",
                sl->sl_sd, sl->sl_busy ? "busy" : "", 0 );
 
-       sl->sl_busy++;
+       sl->sl_busy = 1;
 
        rc = ldap_pvt_thread_pool_submit( &connection_pool,
                slap_listener_thread, (void *) sl );
 
        if( rc != 0 ) {
                Debug( LDAP_DEBUG_ANY,
-                       "listener_activate(%d): submit failed (%d)\n",
+                       "slap_listener_activate(%d): submit failed (%d)\n",
                        sl->sl_sd, rc, 0 );
        }
        return rc;
 }
-#endif
 
 static void *
 slapd_daemon_task(
@@ -1619,27 +2117,18 @@ slapd_daemon_task(
 {
        int l;
        time_t last_idle_check = 0;
-       struct timeval idle;
        int ebadf = 0;
+       int tid = (int)ptr;
 
 #define SLAPD_IDLE_CHECK_LIMIT 4
 
-       if ( global_idletimeout > 0 ) {
-               last_idle_check = slap_get_time();
-               /* Set the select timeout.
-                * Don't just truncate, preserve the fractions of
-                * seconds to prevent sleeping for zero time.
-                */
-               idle.tv_sec = global_idletimeout / SLAPD_IDLE_CHECK_LIMIT;
-               idle.tv_usec = global_idletimeout - \
-                       ( idle.tv_sec * SLAPD_IDLE_CHECK_LIMIT );
-               idle.tv_usec *= 1000000 / SLAPD_IDLE_CHECK_LIMIT;
-       } else {
-               idle.tv_sec = 0;
-               idle.tv_usec = 0;
-       }
+       slapd_add( wake_sds[tid][0], 0, NULL, tid );
+       if ( tid )
+               goto loop;
 
-       slapd_add( wake_sds[0], 0, NULL );
+       /* Init stuff done only by thread 0 */
+
+       last_idle_check = slap_get_time();
 
        for ( l = 0; slap_listeners[l] != NULL; l++ ) {
                if ( slap_listeners[l]->sl_sd == AC_SOCKET_INVALID ) continue;
@@ -1651,9 +2140,134 @@ slapd_daemon_task(
                 */
                if ( slap_listeners[l]->sl_is_udp )
                        continue;
-#endif
+#endif /* LDAP_CONNECTIONLESS */
+
+               /* FIXME: TCP-only! */
+#ifdef LDAP_TCP_BUFFER
+               if ( 1 ) {
+                       int origsize, size, realsize, rc;
+                       socklen_t optlen;
+                       char buf[ SLAP_TEXT_BUFLEN ];
+
+                       size = 0;
+                       if ( slap_listeners[l]->sl_tcp_rmem > 0 ) {
+                               size = slap_listeners[l]->sl_tcp_rmem;
+                       } else if ( slapd_tcp_rmem > 0 ) {
+                               size = slapd_tcp_rmem;
+                       }
+
+                       if ( size > 0 ) {
+                               optlen = sizeof( origsize );
+                               rc = getsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_RCVBUF,
+                                       (void *)&origsize,
+                                       &optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: getsockopt(SO_RCVBUF) failed errno=%d (%s)\n",
+                                               err, sock_errstr(err), 0 );
+                               }
+
+                               optlen = sizeof( size );
+                               rc = setsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_RCVBUF,
+                                       (const void *)&size,
+                                       optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: setsockopt(SO_RCVBUF) failed errno=%d (%s)\n",
+                                               err, sock_errstr(err), 0 );
+                               }
 
-               if ( listen( slap_listeners[l]->sl_sd, SLAPD_LISTEN_BACKLOG ) == -1 ) {
+                               optlen = sizeof( realsize );
+                               rc = getsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_RCVBUF,
+                                       (void *)&realsize,
+                                       &optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: getsockopt(SO_RCVBUF) failed errno=%d (%s)\n",
+                                               err, sock_errstr(err), 0 );
+                               }
+
+                               snprintf( buf, sizeof( buf ),
+                                       "url=%s (#%d) RCVBUF original size=%d requested size=%d real size=%d", 
+                                       slap_listeners[l]->sl_url.bv_val, l, origsize, size, realsize );
+                               Debug( LDAP_DEBUG_ANY,
+                                       "slapd_daemon_task: %s\n",
+                                       buf, 0, 0 );
+                       }
+
+                       size = 0;
+                       if ( slap_listeners[l]->sl_tcp_wmem > 0 ) {
+                               size = slap_listeners[l]->sl_tcp_wmem;
+                       } else if ( slapd_tcp_wmem > 0 ) {
+                               size = slapd_tcp_wmem;
+                       }
+
+                       if ( size > 0 ) {
+                               optlen = sizeof( origsize );
+                               rc = getsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_SNDBUF,
+                                       (void *)&origsize,
+                                       &optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: getsockopt(SO_SNDBUF) failed errno=%d (%s)\n",
+                                               err, sock_errstr(err), 0 );
+                               }
+
+                               optlen = sizeof( size );
+                               rc = setsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_SNDBUF,
+                                       (const void *)&size,
+                                       optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: setsockopt(SO_SNDBUF) failed errno=%d (%s)",
+                                               err, sock_errstr(err), 0 );
+                               }
+
+                               optlen = sizeof( realsize );
+                               rc = getsockopt( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ),
+                                       SOL_SOCKET,
+                                       SO_SNDBUF,
+                                       (void *)&realsize,
+                                       &optlen );
+
+                               if ( rc ) {
+                                       int err = sock_errno();
+                                       Debug( LDAP_DEBUG_ANY,
+                                               "slapd_daemon_task: getsockopt(SO_SNDBUF) failed errno=%d (%s)\n",
+                                               err, sock_errstr(err), 0 );
+                               }
+
+                               snprintf( buf, sizeof( buf ),
+                                       "url=%s (#%d) SNDBUF original size=%d requested size=%d real size=%d", 
+                                       slap_listeners[l]->sl_url.bv_val, l, origsize, size, realsize );
+                               Debug( LDAP_DEBUG_ANY,
+                                       "slapd_daemon_task: %s\n",
+                                       buf, 0, 0 );
+                       }
+               }
+#endif /* LDAP_TCP_BUFFER */
+
+               if ( listen( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ), SLAPD_LISTEN_BACKLOG ) == -1 ) {
                        int err = sock_errno();
 
 #ifdef LDAP_PF_INET6
@@ -1690,7 +2304,7 @@ slapd_daemon_task(
                                        }
                                }
                        }
-#endif                         
+#endif /* LDAP_PF_INET6 */
                        Debug( LDAP_DEBUG_ANY,
                                "daemon: listen(%s, 5) failed errno=%d (%s)\n",
                                        slap_listeners[l]->sl_url.bv_val, err,
@@ -1698,48 +2312,39 @@ slapd_daemon_task(
                        return (void*)-1;
                }
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
                /* make the listening socket non-blocking */
-               if ( ber_pvt_socket_set_nonblock( slap_listeners[l]->sl_sd, 1 ) < 0 ) {
+               if ( ber_pvt_socket_set_nonblock( SLAP_FD2SOCK( slap_listeners[l]->sl_sd ), 1 ) < 0 ) {
                        Debug( LDAP_DEBUG_ANY, "slapd_daemon_task: "
                                "set nonblocking on a listening socket failed\n",
                                0, 0, 0 );
                        slapd_shutdown = 2;
                        return (void*)-1;
                }
-#endif
 
-               slapd_add( slap_listeners[l]->sl_sd, 0, slap_listeners[l] );
+               slapd_add( slap_listeners[l]->sl_sd, 0, slap_listeners[l], -1 );
        }
 
 #ifdef HAVE_NT_SERVICE_MANAGER
        if ( started_event != NULL ) {
                ldap_pvt_thread_cond_signal( &started_event );
        }
-#endif
+#endif /* HAVE_NT_SERVICE_MANAGER */
 
-#ifdef SLAP_SEM_LOAD_CONTROL
-       /*
-        * initialize count and lazyness of a semaphore
-        */
-       (void) ldap_lazy_sem_init(
-               SLAP_MAX_WORKER_THREADS + 4 /* max workers + margin */,
-               4 /* lazyness */ );
-#endif
+loop:
 
        /* initialization complete. Here comes the loop. */
 
        while ( !slapd_shutdown ) {
-               ber_socket_t i;
-               int ns, nwriters;
-               int at;
-               ber_socket_t nfds;
+               ber_socket_t            i;
+               int                     ns, nwriters;
+               int                     at;
+               ber_socket_t            nfds;
 #if SLAP_EVENTS_ARE_INDEXED
-               ber_socket_t nrfds, nwfds;
-#endif
+               ber_socket_t            nrfds, nwfds;
+#endif /* SLAP_EVENTS_ARE_INDEXED */
 #define SLAPD_EBADF_LIMIT 16
 
-               time_t  now;
+               time_t                  now;
 
                SLAP_EVENT_DECL;
 
@@ -1747,23 +2352,45 @@ slapd_daemon_task(
                struct timeval          *tvp;
 
                struct timeval          cat;
-               time_t                          tdelta = 1;
+               time_t                  tdelta = 1;
                struct re_s*            rtask;
+
                now = slap_get_time();
 
-               if( ( global_idletimeout > 0 ) &&
-                       difftime( last_idle_check +
-                       global_idletimeout/SLAPD_IDLE_CHECK_LIMIT, now ) < 0 ) {
-                       connections_timeout_idle( now );
-                       last_idle_check = now;
+               if ( !tid && ( global_idletimeout > 0 || chk_writetime )) {
+                       int check = 0;
+                       /* Set the select timeout.
+                        * Don't just truncate, preserve the fractions of
+                        * seconds to prevent sleeping for zero time.
+                        */
+                       if ( chk_writetime ) {
+                               tv.tv_sec = global_writetimeout;
+                               tv.tv_usec = 0;
+                               if ( difftime( chk_writetime, now ) < 0 )
+                                       check = 2;
+                       } else {
+                               tv.tv_sec = global_idletimeout / SLAPD_IDLE_CHECK_LIMIT;
+                               tv.tv_usec = global_idletimeout - \
+                                       ( tv.tv_sec * SLAPD_IDLE_CHECK_LIMIT );
+                               tv.tv_usec *= 1000000 / SLAPD_IDLE_CHECK_LIMIT;
+                               if ( difftime( last_idle_check +
+                                       global_idletimeout/SLAPD_IDLE_CHECK_LIMIT, now ) < 0 )
+                                       check = 1;
+                       }
+                       if ( check ) {
+                               connections_timeout_idle( now );
+                               last_idle_check = now;
+                       }
+               } else {
+                       tv.tv_sec = 0;
+                       tv.tv_usec = 0;
                }
-               tv = idle;
 
 #ifdef SIGHUP
-               if( slapd_gentle_shutdown ) {
+               if ( slapd_gentle_shutdown ) {
                        ber_socket_t active;
 
-                       if( slapd_gentle_shutdown == 1 ) {
+                       if ( !tid && slapd_gentle_shutdown == 1 ) {
                                BackendDB *be;
                                Debug( LDAP_DEBUG_ANY, "slapd gentle shutdown\n", 0, 0, 0 );
                                close_listeners( 1 );
@@ -1774,50 +2401,58 @@ slapd_daemon_task(
                                slapd_gentle_shutdown = 2;
                        }
 
-                       ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
-                       active = slap_daemon.sd_nactives;
-                       ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
-                       if( active == 0 ) {
-                               slapd_shutdown = 1;
-                               break;
+                       ldap_pvt_thread_mutex_lock( &slap_daemon[tid].sd_mutex );
+                       active = slap_daemon[tid].sd_nactives;
+                       ldap_pvt_thread_mutex_unlock( &slap_daemon[tid].sd_mutex );
+
+                       if ( active == 0 ) {
+                               if ( !tid ) {
+                                       for ( l=1; l<slapd_daemon_threads; l++ ) {
+                                               ldap_pvt_thread_mutex_lock( &slap_daemon[l].sd_mutex );
+                                               active += slap_daemon[l].sd_nactives;
+                                               ldap_pvt_thread_mutex_unlock( &slap_daemon[l].sd_mutex );
+                                       }
+                                       if ( !active )
+                                               slapd_shutdown = 1;
+                               }
+                               if ( !active )
+                                       break;
                        }
                }
-#endif
+#endif /* SIGHUP */
                at = 0;
 
-               ldap_pvt_thread_mutex_lock( &slap_daemon.sd_mutex );
+               ldap_pvt_thread_mutex_lock( &slap_daemon[tid].sd_mutex );
 
-               nwriters = slap_daemon.sd_nwriters;
+               nwriters = slap_daemon[tid].sd_nwriters;
 
+               if ( listening )
                for ( l = 0; slap_listeners[l] != NULL; l++ ) {
                        Listener *lr = slap_listeners[l];
 
                        if ( lr->sl_sd == AC_SOCKET_INVALID ) continue;
+                       if ( DAEMON_ID( lr->sl_sd ) != tid ) continue;
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
                        if ( lr->sl_mute || lr->sl_busy )
-#else
-                       if ( lr->sl_mute )
-#endif
                        {
-                           SLAP_SOCK_CLR_READ( lr->sl_sd );
+                               SLAP_SOCK_CLR_READ( tid, lr->sl_sd );
                        } else {
-                               SLAP_SOCK_SET_READ( lr->sl_sd );
+                               SLAP_SOCK_SET_READ( tid, lr->sl_sd );
                        }
                }
 
-               SLAP_EVENT_INIT;
+               SLAP_EVENT_INIT(tid);
 
-               nfds = SLAP_EVENT_MAX;
+               nfds = SLAP_EVENT_MAX(tid);
 
-               if ( global_idletimeout && slap_daemon.sd_nactives ) at = 1;
+               if (( chk_writetime || global_idletimeout ) && slap_daemon[tid].sd_nactives ) at = 1;
 
-               ldap_pvt_thread_mutex_unlock( &slap_daemon.sd_mutex );
+               ldap_pvt_thread_mutex_unlock( &slap_daemon[tid].sd_mutex );
 
                if ( at 
 #if defined(HAVE_YIELDING_SELECT) || defined(NO_THREADS)
                        &&  ( tv.tv_sec || tv.tv_usec )
-#endif
+#endif /* HAVE_YIELDING_SELECT || NO_THREADS */
                        )
                {
                        tvp = &tv;
@@ -1825,30 +2460,39 @@ slapd_daemon_task(
                        tvp = NULL;
                }
 
-               ldap_pvt_thread_mutex_lock( &slapd_rq.rq_mutex );
-               rtask = ldap_pvt_runqueue_next_sched( &slapd_rq, &cat );
-               while ( rtask && cat.tv_sec && cat.tv_sec <= now ) {
-                       if ( ldap_pvt_runqueue_isrunning( &slapd_rq, rtask )) {
-                               ldap_pvt_runqueue_resched( &slapd_rq, rtask, 0 );
-                       } else {
-                               ldap_pvt_runqueue_runtask( &slapd_rq, rtask );
-                               ldap_pvt_runqueue_resched( &slapd_rq, rtask, 0 );
-                               ldap_pvt_thread_mutex_unlock( &slapd_rq.rq_mutex );
-                               ldap_pvt_thread_pool_submit( &connection_pool,
-                                       rtask->routine, (void *) rtask );
-                               ldap_pvt_thread_mutex_lock( &slapd_rq.rq_mutex );
-                       }
+               /* Only thread 0 handles runqueue */
+               if ( !tid ) {
+                       ldap_pvt_thread_mutex_lock( &slapd_rq.rq_mutex );
                        rtask = ldap_pvt_runqueue_next_sched( &slapd_rq, &cat );
-               }
-               ldap_pvt_thread_mutex_unlock( &slapd_rq.rq_mutex );
-
-               if ( rtask && cat.tv_sec ) {
-                       time_t diff = difftime( cat.tv_sec, now );
-                       if ( diff == 0 ) diff = tdelta;
-                       if ( tvp == NULL || diff < tv.tv_sec ) {
-                               tv.tv_sec = diff;
-                               tv.tv_usec = 0;
-                               tvp = &tv;
+                       while ( rtask && cat.tv_sec && cat.tv_sec <= now ) {
+                               if ( ldap_pvt_runqueue_isrunning( &slapd_rq, rtask )) {
+                                       ldap_pvt_runqueue_resched( &slapd_rq, rtask, 0 );
+                               } else {
+                                       ldap_pvt_runqueue_runtask( &slapd_rq, rtask );
+                                       ldap_pvt_runqueue_resched( &slapd_rq, rtask, 0 );
+                                       ldap_pvt_thread_mutex_unlock( &slapd_rq.rq_mutex );
+                                       ldap_pvt_thread_pool_submit( &connection_pool,
+                                               rtask->routine, (void *) rtask );
+                                       ldap_pvt_thread_mutex_lock( &slapd_rq.rq_mutex );
+                               }
+                               rtask = ldap_pvt_runqueue_next_sched( &slapd_rq, &cat );
+                       }
+                       ldap_pvt_thread_mutex_unlock( &slapd_rq.rq_mutex );
+
+                       if ( rtask && cat.tv_sec ) {
+                               /* NOTE: diff __should__ always be >= 0,
+                                * AFAI understand; however (ITS#4872),
+                                * time_t might be unsigned in some systems,
+                                * while difftime() returns a double */
+                               double diff = difftime( cat.tv_sec, now );
+                               if ( diff <= 0 ) {
+                                       diff = tdelta;
+                               }
+                               if ( tvp == NULL || diff < tv.tv_sec ) {
+                                       tv.tv_sec = diff;
+                                       tv.tv_usec = 0;
+                                       tvp = &tv;
+                               }
                        }
                }
 
@@ -1861,40 +2505,47 @@ slapd_daemon_task(
 
                        if ( lr->sl_mute ) {
                                Debug( LDAP_DEBUG_CONNS,
-                                       "daemon: select: listen=%d muted\n",
+                                       "daemon: " SLAP_EVENT_FNAME ": "
+                                       "listen=%d muted\n",
                                        lr->sl_sd, 0, 0 );
                                continue;
                        }
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
                        if ( lr->sl_busy ) {
                                Debug( LDAP_DEBUG_CONNS,
-                                       "daemon: select: listen=%d busy\n",
+                                       "daemon: " SLAP_EVENT_FNAME ": "
+                                       "listen=%d busy\n",
                                        lr->sl_sd, 0, 0 );
                                continue;
                        }
-#endif
 
                        Debug( LDAP_DEBUG_CONNS,
-                               "daemon: select: listen=%d active_threads=%d tvp=%s\n",
+                               "daemon: " SLAP_EVENT_FNAME ": "
+                               "listen=%d active_threads=%d tvp=%s\n",
                                lr->sl_sd, at, tvp == NULL ? "NULL" : "zero" );
                }
 
-               switch(ns = SLAP_EVENT_WAIT(tvp)) {
+               SLAP_EVENT_WAIT( tid, tvp, &ns );
+               switch ( ns ) {
                case -1: {      /* failure - try again */
                                int err = sock_errno();
 
-                               if( err != EINTR ) {
+                               if ( err != EINTR ) {
                                        ebadf++;
 
                                        /* Don't log unless we got it twice in a row */
-                                       if ( !( ebadf & 1 )) {
+                                       if ( !( ebadf & 1 ) ) {
                                                Debug( LDAP_DEBUG_ANY,
-                                                       "daemon: select failed count %d err (%d): %s\n",
-                                                       ebadf, err, sock_errstr(err) );
+                                                       "daemon: "
+                                                       SLAP_EVENT_FNAME
+                                                       " failed count %d "
+                                                       "err (%d): %s\n",
+                                                       ebadf, err,
+                                                       sock_errstr( err ) );
                                        }
-                                       if ( ebadf >= SLAPD_EBADF_LIMIT )
+                                       if ( ebadf >= SLAPD_EBADF_LIMIT ) {
                                                slapd_shutdown = 2;
+                                       }
                                }
                        }
                        continue;
@@ -1902,15 +2553,16 @@ slapd_daemon_task(
                case 0:         /* timeout - let threads run */
                        ebadf = 0;
 #ifndef HAVE_YIELDING_SELECT
-                       Debug( LDAP_DEBUG_CONNS, "daemon: select timeout - yielding\n",
-                           0, 0, 0 );
+                       Debug( LDAP_DEBUG_CONNS, "daemon: " SLAP_EVENT_FNAME
+                               "timeout - yielding\n",
+                               0, 0, 0 );
 
                        ldap_pvt_thread_yield();
-#endif
+#endif /* ! HAVE_YIELDING_SELECT */
                        continue;
 
                default:        /* something happened - deal with it */
-                       if( slapd_shutdown ) continue;
+                       if ( slapd_shutdown ) continue;
 
                        ebadf = 0;
                        Debug( LDAP_DEBUG_CONNS,
@@ -1920,11 +2572,11 @@ slapd_daemon_task(
                }
 
 #if SLAP_EVENTS_ARE_INDEXED
-               if ( SLAP_EVENT_IS_READ( wake_sds[0] )) {
+               if ( SLAP_EVENT_IS_READ( wake_sds[tid][0] ) ) {
                        char c[BUFSIZ];
-                       SLAP_EVENT_CLR_READ( wake_sds[0] );
+                       SLAP_EVENT_CLR_READ( wake_sds[tid][0] );
                        waking = 0;
-                       tcp_read( wake_sds[0], c, sizeof(c) );
+                       tcp_read( SLAP_FD2SOCK(wake_sds[tid][0]), c, sizeof(c) );
                        Debug( LDAP_DEBUG_CONNS, "daemon: waked\n", 0, 0, 0 );
                        continue;
                }
@@ -1933,6 +2585,7 @@ slapd_daemon_task(
                 * true for Unix select and poll. We treat Windows select
                 * like this too, even though it's a kludge.
                 */
+               if ( listening )
                for ( l = 0; slap_listeners[l] != NULL; l++ ) {
                        int rc;
 
@@ -1940,43 +2593,26 @@ slapd_daemon_task(
                        if ( slap_listeners[l]->sl_sd == AC_SOCKET_INVALID ) continue;
 #ifdef LDAP_CONNECTIONLESS
                        if ( slap_listeners[l]->sl_is_udp ) continue;
-#endif
-                       if ( !SLAP_EVENT_IS_READ( slap_listeners[l]->sl_sd )) continue;
+#endif /* LDAP_CONNECTIONLESS */
+                       if ( !SLAP_EVENT_IS_READ( slap_listeners[l]->sl_sd ) ) continue;
                        
                        /* clear events */
                        SLAP_EVENT_CLR_READ( slap_listeners[l]->sl_sd );
                        SLAP_EVENT_CLR_WRITE( slap_listeners[l]->sl_sd );
                        ns--;
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
-                       rc = slap_listener_activate(slap_listeners[l]);
-#else
-                       rc = slap_listener(slap_listeners[l]);
-#endif
+                       rc = slap_listener_activate( slap_listeners[l] );
                }
 
                /* bypass the following tests if no descriptors left */
                if ( ns <= 0 ) {
 #ifndef HAVE_YIELDING_SELECT
                        ldap_pvt_thread_yield();
-#endif
+#endif /* HAVE_YIELDING_SELECT */
                        continue;
                }
 
                Debug( LDAP_DEBUG_CONNS, "daemon: activity on:", 0, 0, 0 );
-#ifdef HAVE_WINSOCK
-               nrfds = readfds.fd_count;
-               nwfds = writefds.fd_count;
-               for ( i = 0; i < readfds.fd_count; i++ ) {
-                       Debug( LDAP_DEBUG_CONNS, " %d%s",
-                               readfds.fd_array[i], "r", 0 );
-               }
-               for ( i = 0; i < writefds.fd_count; i++ ) {
-                       Debug( LDAP_DEBUG_CONNS, " %d%s",
-                               writefds.fd_array[i], "w", 0 );
-               }
-
-#else
                nrfds = 0;
                nwfds = 0;
                for ( i = 0; i < nfds; i++ ) {
@@ -1999,19 +2635,13 @@ slapd_daemon_task(
                        }
                        if ( ns <= 0 ) break;
                }
-#endif
                Debug( LDAP_DEBUG_CONNS, "\n", 0, 0, 0 );
 
-
                /* loop through the writers */
                for ( i = 0; nwfds > 0; i++ ) {
                        ber_socket_t wd;
-#ifdef HAVE_WINSOCK
-                       wd = writefds.fd_array[i];
-#else
-                       if( ! SLAP_EVENT_IS_WRITE( i ) ) continue;
+                       if ( ! SLAP_EVENT_IS_WRITE( i ) ) continue;
                        wd = i;
-#endif
 
                        SLAP_EVENT_CLR_WRITE( wd );
                        nwfds--;
@@ -2030,7 +2660,7 @@ slapd_daemon_task(
                         * close it here. It has already been closed in connection.c.
                         */
                        if ( connection_write( wd ) < 0 ) {
-                               if ( SLAP_EVENT_IS_READ( wd )) {
+                               if ( SLAP_EVENT_IS_READ( wd ) ) {
                                        SLAP_EVENT_CLR_READ( (unsigned) wd );
                                        nrfds--;
                                }
@@ -2039,12 +2669,8 @@ slapd_daemon_task(
 
                for ( i = 0; nrfds > 0; i++ ) {
                        ber_socket_t rd;
-#ifdef HAVE_WINSOCK
-                       rd = readfds.fd_array[i];
-#else
-                       if( ! SLAP_EVENT_IS_READ( i ) ) continue;
+                       if ( ! SLAP_EVENT_IS_READ( i ) ) continue;
                        rd = i;
-#endif
                        SLAP_EVENT_CLR_READ( rd );
                        nrfds--;
 
@@ -2057,11 +2683,7 @@ slapd_daemon_task(
                         * active.
                         */
 
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
                        connection_read_activate( rd );
-#else
-                       connection_read( rd );
-#endif
                }
 #else  /* !SLAP_EVENTS_ARE_INDEXED */
        /* FIXME */
@@ -2083,41 +2705,38 @@ slapd_daemon_task(
 #ifdef LDAP_DEBUG
                Debug( LDAP_DEBUG_CONNS, "daemon: activity on:", 0, 0, 0 );
 
-               for (i=0; i<ns; i++) {
-                       int     r, w;
+               for ( i = 0; i < ns; i++ ) {
+                       int     r, w, fd;
 
                        /* Don't log listener events */
-                       if ( SLAP_EVENT_IS_LISTENER(i)
+                       if ( SLAP_EVENT_IS_LISTENER( tid, i )
 #ifdef LDAP_CONNECTIONLESS
-                               && !((SLAP_EVENT_LISTENER(i))->sl_is_udp)
-#endif
+                               && !( (SLAP_EVENT_LISTENER( tid, i ))->sl_is_udp )
+#endif /* LDAP_CONNECTIONLESS */
                                )
                        {
                                continue;
                        }
 
+                       fd = SLAP_EVENT_FD( tid, i );
                        /* Don't log internal wake events */
-                       if ( SLAP_EVENT_FD( i ) == wake_sds[0] ) continue;
+                       if ( fd == wake_sds[tid][0] ) continue;
 
                        r = SLAP_EVENT_IS_READ( i );
                        w = SLAP_EVENT_IS_WRITE( i );
                        if ( r || w ) {
-                               Debug( LDAP_DEBUG_CONNS, " %d%s%s", SLAP_EVENT_FD(i),
+                               Debug( LDAP_DEBUG_CONNS, " %d%s%s", fd,
                                    r ? "r" : "", w ? "w" : "" );
                        }
                }
                Debug( LDAP_DEBUG_CONNS, "\n", 0, 0, 0 );
-#endif
+#endif /* LDAP_DEBUG */
 
-               for (i=0; i<ns; i++) {
-                       int rc = 1, fd;
+               for ( i = 0; i < ns; i++ ) {
+                       int rc = 1, fd, w = 0, r = 0;
 
-                       if ( SLAP_EVENT_IS_LISTENER(i) ) {
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
-                               rc = slap_listener_activate( SLAP_EVENT_LISTENER( i ));
-#else
-                               rc = slap_listener( SLAP_EVENT_LISTENER( i ));
-#endif
+                       if ( SLAP_EVENT_IS_LISTENER( tid, i ) ) {
+                               rc = slap_listener_activate( SLAP_EVENT_LISTENER( tid, i ) );
                        }
 
                        /* If we found a regular listener, rc is now zero, and we
@@ -2125,22 +2744,23 @@ slapd_daemon_task(
                         * then rc is still 1, and we want to handle the data.
                         */
                        if ( rc ) {
-                               fd = SLAP_EVENT_FD( i );
+                               fd = SLAP_EVENT_FD( tid, i );
 
                                /* Handle wake events */
-                               if ( fd == wake_sds[0] ) {
+                               if ( fd == wake_sds[tid][0] ) {
                                        char c[BUFSIZ];
                                        waking = 0;
-                                       tcp_read( wake_sds[0], c, sizeof(c) );
-                                       break;
+                                       tcp_read( SLAP_FD2SOCK(wake_sds[tid][0]), c, sizeof(c) );
+                                       continue;
                                }
 
-                               if( SLAP_EVENT_IS_WRITE( i ) ) {
+                               if ( SLAP_EVENT_IS_WRITE( i ) ) {
                                        Debug( LDAP_DEBUG_CONNS,
                                                "daemon: write active on %d\n",
                                                fd, 0, 0 );
 
                                        SLAP_EVENT_CLR_WRITE( i );
+                                       w = 1;
 
                                        /*
                                         * NOTE: it is possible that the connection was closed
@@ -2153,26 +2773,25 @@ slapd_daemon_task(
                                        }
                                }
                                /* If event is a read */
-                               if( SLAP_EVENT_IS_READ( i )) {
+                               if ( SLAP_EVENT_IS_READ( i ))
+                                       r = 1;
+                               if ( r || !w ) {
                                        Debug( LDAP_DEBUG_CONNS,
                                                "daemon: read active on %d\n",
                                                fd, 0, 0 );
 
-                                       SLAP_EVENT_CLR_READ( i );
-#ifdef SLAP_LIGHTWEIGHT_DISPATCHER
-                                       connection_read_activate( fd );
-#else
-                                       /*
-                                        * NOTE: it is possible that the connection was closed
-                                        * and that the stream is now inactive.
-                                        * connection_read() must valid the stream is still
-                                        * active.
-                                        */
-                                       connection_read( fd );
+                                       if ( r ) {
+                                               SLAP_EVENT_CLR_READ( i );
+                                       } else {
+#ifdef HAVE_EPOLL
+                                               /* Don't keep reporting the hangup
+                                                */
+                                               if ( SLAP_SOCK_IS_ACTIVE( tid, fd )) {
+                                                       SLAP_EPOLL_SOCK_SET( tid, fd, EPOLLET );
+                                               }
 #endif
-                               } else {
-                                       Debug( LDAP_DEBUG_CONNS,
-                                               "daemon: hangup on %d\n", fd, 0, 0 );
+                                       }
+                                       connection_read_activate( fd );
                                }
                        }
                }
@@ -2180,10 +2799,14 @@ slapd_daemon_task(
 
 #ifndef HAVE_YIELDING_SELECT
                ldap_pvt_thread_yield();
-#endif
+#endif /* ! HAVE_YIELDING_SELECT */
        }
 
-       if( slapd_shutdown == 1 ) {
+       /* Only thread 0 handles shutdown */
+       if ( tid )
+               return NULL;
+
+       if ( slapd_shutdown == 1 ) {
                Debug( LDAP_DEBUG_ANY,
                        "daemon: shutdown requested and initiated.\n",
                        0, 0, 0 );
@@ -2204,43 +2827,47 @@ slapd_daemon_task(
                       0, 0, 0 );
        }
 
-       if( slapd_gentle_shutdown != 2 ) close_listeners ( 0 );
+       close_listeners( 0 );
 
-       if( !slapd_gentle_shutdown ) {
+       if ( !slapd_gentle_shutdown ) {
                slapd_abrupt_shutdown = 1;
                connections_shutdown();
        }
 
-       Debug( LDAP_DEBUG_ANY,
-           "slapd shutdown: waiting for %d threads to terminate\n",
-           ldap_pvt_thread_pool_backload(&connection_pool), 0, 0 );
-       ldap_pvt_thread_pool_destroy(&connection_pool, 1);
-
-       free ( slap_listeners );
-       slap_listeners = NULL;
+       if ( LogTest( LDAP_DEBUG_ANY )) {
+               int t = ldap_pvt_thread_pool_backload( &connection_pool );
+               Debug( LDAP_DEBUG_ANY,
+                       "slapd shutdown: waiting for %d operations/tasks to finish\n",
+                       t, 0, 0 );
+       }
+       ldap_pvt_thread_pool_destroy( &connection_pool, 1 );
 
        return NULL;
 }
 
 
 #ifdef LDAP_CONNECTIONLESS
-static int connectionless_init(void)
+static int
+connectionless_init( void )
 {
        int l;
 
        for ( l = 0; slap_listeners[l] != NULL; l++ ) {
                Listener *lr = slap_listeners[l];
-               long id;
+               Connection *c;
 
-               if( !lr->sl_is_udp ) {
+               if ( !lr->sl_is_udp ) {
                        continue;
                }
 
-               id = connection_init( lr->sl_sd, lr, "", "", CONN_IS_UDP, (slap_ssf_t) 0, NULL );
+               c = connection_init( lr->sl_sd, lr, "", "",
+                       CONN_IS_UDP, (slap_ssf_t) 0, NULL
+                       LDAP_PF_LOCAL_SENDMSG_ARG(NULL));
 
-               if( id < 0 ) {
+               if ( !c ) {
                        Debug( LDAP_DEBUG_TRACE,
-                               "connectionless_init: failed on %s (%d)\n", lr->sl_url, lr->sl_sd, 0 );
+                               "connectionless_init: failed on %s (%d)\n",
+                               lr->sl_url.bv_val, lr->sl_sd, 0 );
                        return -1;
                }
                lr->sl_is_udp++;
@@ -2250,46 +2877,61 @@ static int connectionless_init(void)
 }
 #endif /* LDAP_CONNECTIONLESS */
 
-int slapd_daemon( void )
+int
+slapd_daemon( void )
 {
-       int rc;
+       int i, rc;
+       ldap_pvt_thread_t       *listener_tid;
 
-       connections_init();
 #ifdef LDAP_CONNECTIONLESS
        connectionless_init();
-#endif
+#endif /* LDAP_CONNECTIONLESS */
+
+       listener_tid = ch_malloc(slapd_daemon_threads * sizeof(ldap_pvt_thread_t));
 
-#define SLAPD_LISTENER_THREAD 1
-#if defined( SLAPD_LISTENER_THREAD )
+       /* daemon_init only inits element 0 */
+       for ( i=1; i<slapd_daemon_threads; i++ )
        {
-               ldap_pvt_thread_t       listener_tid;
+               ldap_pvt_thread_mutex_init( &slap_daemon[i].sd_mutex );
 
+               if( (rc = lutil_pair( wake_sds[i] )) < 0 ) {
+                       Debug( LDAP_DEBUG_ANY,
+                               "daemon: lutil_pair() failed rc=%d\n", rc, 0, 0 );
+                       return rc;
+               }
+               ber_pvt_socket_set_nonblock( wake_sds[i][1], 1 );
+
+               SLAP_SOCK_INIT(i);
+       }
+
+       for ( i=0; i<slapd_daemon_threads; i++ )
+       {
                /* listener as a separate THREAD */
-               rc = ldap_pvt_thread_create( &listener_tid,
-                       0, slapd_daemon_task, NULL );
+               rc = ldap_pvt_thread_create( &listener_tid[i],
+                       0, slapd_daemon_task, (void *)i );
 
                if ( rc != 0 ) {
                        Debug( LDAP_DEBUG_ANY,
                        "listener ldap_pvt_thread_create failed (%d)\n", rc, 0, 0 );
                        return rc;
                }
-               /* wait for the listener thread to complete */
-               ldap_pvt_thread_join( listener_tid, (void *) NULL );
        }
-#else
-       /* experimental code */
-       slapd_daemon_task( NULL );
-#endif
 
-       return 0;
+       /* wait for the listener threads to complete */
+       for ( i=0; i<slapd_daemon_threads; i++ )
+               ldap_pvt_thread_join( listener_tid[i], (void *)NULL );
 
+       destroy_listeners();
+       ch_free( listener_tid );
+
+       return 0;
 }
 
-static int sockinit(void)
+static int
+sockinit( void )
 {
 #if defined( HAVE_WINSOCK2 )
-    WORD wVersionRequested;
+       WORD wVersionRequested;
        WSADATA wsaData;
        int err;
 
@@ -2321,17 +2963,17 @@ static int sockinit(void)
 #elif defined( HAVE_WINSOCK )
        WSADATA wsaData;
        if ( WSAStartup( 0x0101, &wsaData ) != 0 ) return -1;
-#endif
+#endif /* ! HAVE_WINSOCK2 && ! HAVE_WINSOCK */
 
        return 0;
 }
 
-static int sockdestroy(void)
+static int
+sockdestroy( void )
 {
 #if defined( HAVE_WINSOCK2 ) || defined( HAVE_WINSOCK )
        WSACleanup();
-#endif
-       SLAP_SOCK_SET_DESTROY;
+#endif /* HAVE_WINSOCK2 || HAVE_WINSOCK */
 
        return 0;
 }
@@ -2339,6 +2981,9 @@ static int sockdestroy(void)
 RETSIGTYPE
 slap_sig_shutdown( int sig )
 {
+       int save_errno = errno;
+       int i;
+
 #if 0
        Debug(LDAP_DEBUG_TRACE, "slap_sig_shutdown: signal %d\n", sig, 0, 0);
 #endif
@@ -2349,44 +2994,62 @@ slap_sig_shutdown( int sig )
         * SIGBREAK is generated when a user logs out.
         */
 
-#if HAVE_NT_SERVICE_MANAGER && SIGBREAK
+#if defined(HAVE_NT_SERVICE_MANAGER) && defined(SIGBREAK)
        if (is_NT_Service && sig == SIGBREAK) {
                /* empty */;
        } else
-#endif
+#endif /* HAVE_NT_SERVICE_MANAGER && SIGBREAK */
 #ifdef SIGHUP
        if (sig == SIGHUP && global_gentlehup && slapd_gentle_shutdown == 0) {
                slapd_gentle_shutdown = 1;
        } else
-#endif
+#endif /* SIGHUP */
        {
                slapd_shutdown = 1;
        }
 
-       WAKE_LISTENER(1);
+       for (i=0; i<slapd_daemon_threads; i++) {
+               WAKE_LISTENER(i,1);
+       }
 
        /* reinstall self */
        (void) SIGNAL_REINSTALL( sig, slap_sig_shutdown );
+
+       errno = save_errno;
 }
 
 RETSIGTYPE
 slap_sig_wake( int sig )
 {
-       WAKE_LISTENER(1);
+       int save_errno = errno;
+
+       WAKE_LISTENER(0,1);
 
        /* reinstall self */
        (void) SIGNAL_REINSTALL( sig, slap_sig_wake );
+
+       errno = save_errno;
 }
 
 
-void slapd_add_internal(ber_socket_t s, int isactive) {
-       slapd_add(s, isactive, NULL);
+void
+slapd_add_internal( ber_socket_t s, int isactive )
+{
+       slapd_add( s, isactive, NULL, -1 );
 }
 
-Listener ** slapd_get_listeners(void) {
+Listener **
+slapd_get_listeners( void )
+{
+       /* Could return array with no listeners if !listening, but current
+        * callers mostly look at the URLs.  E.g. syncrepl uses this to
+        * identify the server, which means it wants the startup arguments.
+        */
        return slap_listeners;
 }
 
-void slap_wake_listener() {
-       WAKE_LISTENER(1);
+void
+slap_wake_listener()
+{
+       WAKE_LISTENER(0,1);
 }