X-Git-Url: http://git.pk910.de/?p=ircu2.10.12-pk.git;a=blobdiff_plain;f=ircd%2Fengine_kqueue.c;fp=ircd%2Fengine_kqueue.c;h=a0d00dd645b5d35a49e3f350e142732f4d0cfb34;hp=0000000000000000000000000000000000000000;hb=0400a5a6479398d82526785c18c0df8bc8b92dce;hpb=d17e10da972ce5776c60b4c317267c6abe0e1ead diff --git a/ircd/engine_kqueue.c b/ircd/engine_kqueue.c new file mode 100644 index 0000000..a0d00dd --- /dev/null +++ b/ircd/engine_kqueue.c @@ -0,0 +1,449 @@ +/* + * IRC - Internet Relay Chat, ircd/engine_kqueue.c + * Copyright (C) 2001 Kevin L. Mitchell + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 1, or (at your option) + * any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + */ +/** @file + * @brief FreeBSD kqueue()/kevent() event engine. + * @version $Id$ + */ +#include "config.h" + +#include "ircd_events.h" + +#include "ircd.h" +#include "ircd_alloc.h" +#include "ircd_features.h" +#include "ircd_log.h" +#include "s_debug.h" + +/* #include -- Now using assert in ircd_log.h */ +#include +#include +#include +#include +#include +#include +#include +#include + +#define KQUEUE_ERROR_THRESHOLD 20 /**< after 20 kqueue errors, restart */ +#define ERROR_EXPIRE_TIME 3600 /**< expire errors after an hour */ + +/** Array of active Socket structures, indexed by file descriptor. */ +static struct Socket** sockList; +/** Maximum file descriptor supported, plus one. */ +static int kqueue_max; +/** File descriptor for kqueue pseudo-file. */ +static int kqueue_id; +/** Current array of event descriptors. */ +static struct kevent *events; +/** Number of ::events elements that have been populated. */ +static int events_used; + +/** Number of recent errors from kqueue. */ +static int errors = 0; +/** Periodic timer to forget errors. */ +static struct Timer clear_error; + +/** Decrement the error count (once per hour). + * @param[in] ev Expired timer event (ignored). + */ +static void +error_clear(struct Event* ev) +{ + if (!--errors) /* remove timer when error count reaches 0 */ + timer_del(ev_timer(ev)); +} + +/** Initialize the kqueue engine. + * @param[in] max_sockets Maximum number of file descriptors to support. + * @return Non-zero on success, or zero on failure. + */ +static int +engine_init(int max_sockets) +{ + int i; + + if ((kqueue_id = kqueue()) < 0) { /* initialize... */ + log_write(LS_SYSTEM, L_WARNING, 0, + "kqueue() engine cannot initialize: %m"); + return 0; + } + + /* allocate necessary memory */ + sockList = (struct Socket**) MyMalloc(sizeof(struct Socket*) * max_sockets); + + /* initialize the data */ + for (i = 0; i < max_sockets; i++) + sockList[i] = 0; + + kqueue_max = max_sockets; /* number of sockets allocated */ + + return 1; /* success! */ +} + +/** Add a signal to the event engine. + * @param[in] sig Signal to add to engine. + */ +static void +engine_signal(struct Signal* sig) +{ + struct kevent sigevent; + struct sigaction act; + + assert(0 != sig); + + Debug((DEBUG_ENGINE, "kqueue: Adding filter for signal %d [%p]", + sig_signal(sig), sig)); + + sigevent.ident = sig_signal(sig); /* set up the kqueue event */ + sigevent.filter = EVFILT_SIGNAL; /* looking for signals... */ + sigevent.flags = EV_ADD | EV_ENABLE; /* add and enable it */ + sigevent.fflags = 0; + sigevent.data = 0; + sigevent.udata = sig; /* store our user data */ + + if (kevent(kqueue_id, &sigevent, 1, 0, 0, 0) < 0) { /* add event */ + log_write(LS_SYSTEM, L_WARNING, 0, "Unable to trap signal %d", + sig_signal(sig)); + return; + } + + act.sa_handler = SIG_IGN; /* ignore the signal */ + act.sa_flags = 0; + sigemptyset(&act.sa_mask); + sigaction(sig_signal(sig), &act, 0); +} + +/** Figure out what events go with a given state. + * @param[in] state %Socket state to consider. + * @param[in] events User-specified preferred event set. + * @return Actual set of preferred events. + */ +static unsigned int +state_to_events(enum SocketState state, unsigned int events) +{ + switch (state) { + case SS_CONNECTING: /* connecting socket */ + return SOCK_EVENT_WRITABLE; + break; + + case SS_LISTENING: /* listening socket */ + case SS_NOTSOCK: /* our signal socket--just in case */ + return SOCK_EVENT_READABLE; + break; + + case SS_CONNECTED: case SS_DATAGRAM: case SS_CONNECTDG: + return events; /* ordinary socket */ + break; + } + + /*NOTREACHED*/ + return 0; +} + +/** Activate kqueue filters as appropriate. + * @param[in] sock Socket structure to operate on. + * @param[in] clear Set of interest events to clear from socket. + * @param[in] set Set of interest events to set on socket. + */ +static void +set_or_clear(struct Socket* sock, unsigned int clear, unsigned int set) +{ + int i = 0; + struct kevent chglist[2]; + + assert(0 != sock); + assert(-1 < s_fd(sock)); + + if ((clear ^ set) & SOCK_EVENT_READABLE) { /* readable has changed */ + chglist[i].ident = s_fd(sock); /* set up the change list */ + chglist[i].filter = EVFILT_READ; /* readable filter */ + chglist[i].flags = EV_ADD; /* adding it */ + chglist[i].fflags = 0; + chglist[i].data = 0; + chglist[i].udata = 0; /* I love udata, but it can't really be used here */ + + if (set & SOCK_EVENT_READABLE) /* it's set */ + chglist[i].flags |= EV_ENABLE; + else /* clear it */ + chglist[i].flags |= EV_DISABLE; + + i++; /* advance to next element */ + } + + if ((clear ^ set) & SOCK_EVENT_WRITABLE) { /* writable has changed */ + chglist[i].ident = s_fd(sock); /* set up the change list */ + chglist[i].filter = EVFILT_WRITE; /* writable filter */ + chglist[i].flags = EV_ADD; /* adding it */ + chglist[i].fflags = 0; + chglist[i].data = 0; + chglist[i].udata = 0; + + if (set & SOCK_EVENT_WRITABLE) /* it's set */ + chglist[i].flags |= EV_ENABLE; + else /* clear it */ + chglist[i].flags |= EV_DISABLE; + + i++; /* advance count... */ + } + + if (kevent(kqueue_id, chglist, i, 0, 0, 0) < 0 && errno != EBADF) + event_generate(ET_ERROR, sock, errno); /* report error */ +} + +/** Add a socket to the event engine. + * @param[in] sock Socket to add to engine. + * @return Non-zero on success, or zero on error. + */ +static int +engine_add(struct Socket* sock) +{ + assert(0 != sock); + assert(0 == sockList[s_fd(sock)]); + + /* bounds-check... */ + if (sock->s_fd >= kqueue_max) { + log_write(LS_SYSTEM, L_ERROR, 0, + "Attempt to add socket %d (> %d) to event engine", s_fd(sock), + kqueue_max); + return 0; + } + + sockList[s_fd(sock)] = sock; /* add to list */ + + Debug((DEBUG_ENGINE, "kqueue: Adding socket %d [%p], state %s, to engine", + s_fd(sock), sock, state_to_name(s_state(sock)))); + + /* Add socket to queue */ + set_or_clear(sock, 0, state_to_events(s_state(sock), s_events(sock))); + + return 1; /* success */ +} + +/** Handle state transition for a socket. + * @param[in] sock Socket changing state. + * @param[in] new_state New state for socket. + */ +static void +engine_state(struct Socket* sock, enum SocketState new_state) +{ + assert(0 != sock); + assert(sock == sockList[s_fd(sock)]); + + Debug((DEBUG_ENGINE, "kqueue: Changing state for socket %p to %s", sock, + state_to_name(new_state))); + + /* set the correct events */ + set_or_clear(sock, + state_to_events(s_state(sock), s_events(sock)), /* old state */ + state_to_events(new_state, s_events(sock))); /* new state */ + +} + +/** Handle change to preferred socket events. + * @param[in] sock Socket getting new interest list. + * @param[in] new_events New set of interesting events for socket. + */ +static void +engine_events(struct Socket* sock, unsigned int new_events) +{ + assert(0 != sock); + assert(sock == sockList[s_fd(sock)]); + + Debug((DEBUG_ENGINE, "kqueue: Changing event mask for socket %p to [%s]", + sock, sock_flags(new_events))); + + /* set the correct events */ + set_or_clear(sock, + state_to_events(s_state(sock), s_events(sock)), /* old events */ + state_to_events(s_state(sock), new_events)); /* new events */ +} + +/** Remove a socket from the event engine. + * @param[in] sock Socket being destroyed. + */ +static void +engine_delete(struct Socket* sock) +{ + int ii; + + assert(0 != sock); + assert(sock == sockList[s_fd(sock)]); + + Debug((DEBUG_ENGINE, "kqueue: Deleting socket %d [%p], state %s", + s_fd(sock), sock, state_to_name(s_state(sock)))); + + sockList[s_fd(sock)] = 0; + + /* Drop any unprocessed events citing this socket. */ + for (ii = 0; ii < events_used; ii++) { + if (events[ii].ident == s_fd(sock)) { + events[ii] = events[--events_used]; + } + } +} + +/** Run engine event loop. + * @param[in] gen Lists of generators of various types. + */ +static void +engine_loop(struct Generators* gen) +{ + int events_count; + struct kevent *evt; + struct Socket* sock; + struct timespec wait; + int i; + int errcode; + socklen_t codesize; + + if ((events_count = feature_int(FEAT_POLLS_PER_LOOP)) < 20) + events_count = 20; + events = (struct kevent *)MyMalloc(sizeof(struct kevent) * events_count); + + while (running) { + if ((i = feature_int(FEAT_POLLS_PER_LOOP)) >= 20 && i != events_count) { + events = (struct kevent *)MyRealloc(events, sizeof(struct kevent) * i); + events_count = i; + } + + /* set up the sleep time */ + wait.tv_sec = timer_next(gen) ? (timer_next(gen) - CurrentTime) : -1; + wait.tv_nsec = 0; + + Debug((DEBUG_ENGINE, "kqueue: delay: %Tu (%Tu) %Tu", timer_next(gen), + CurrentTime, wait.tv_sec)); + + /* check for active events */ + events_used = kevent(kqueue_id, 0, 0, events, events_count, + wait.tv_sec < 0 ? 0 : &wait); + + CurrentTime = time(0); /* set current time... */ + + if (events_used < 0) { + if (errno != EINTR) { /* ignore kevent interrupts */ + /* Log the kqueue error */ + log_write(LS_SOCKET, L_ERROR, 0, "kevent() error: %m"); + if (!errors++) + timer_add(timer_init(&clear_error), error_clear, 0, TT_PERIODIC, + ERROR_EXPIRE_TIME); + else if (errors > KQUEUE_ERROR_THRESHOLD) /* too many errors... */ + server_restart("too many kevent errors"); + } + /* old code did a sleep(1) here; with usage these days, + * that may be too expensive + */ + continue; + } + + while (events_used > 0) { + evt = &events[--events_used]; + + if (evt->filter == EVFILT_SIGNAL) { + /* it's a signal; deal appropriately */ + event_generate(ET_SIGNAL, evt->udata, evt->ident); + continue; /* skip socket processing loop */ + } + + assert(evt->filter == EVFILT_READ || evt->filter == EVFILT_WRITE); + + sock = sockList[evt->ident]; + if (!sock) /* slots may become empty while processing events */ + continue; + + assert(s_fd(sock) == evt->ident); + + gen_ref_inc(sock); /* can't have it going away on us */ + + Debug((DEBUG_ENGINE, "kqueue: Checking socket %p (fd %d) state %s, " + "events %s", sock, s_fd(sock), state_to_name(s_state(sock)), + sock_flags(s_events(sock)))); + + if (s_state(sock) != SS_NOTSOCK) { + errcode = 0; /* check for errors on socket */ + codesize = sizeof(errcode); + if (getsockopt(s_fd(sock), SOL_SOCKET, SO_ERROR, &errcode, + &codesize) < 0) + errcode = errno; /* work around Solaris implementation */ + + if (errcode) { /* an error occurred; generate an event */ + Debug((DEBUG_ENGINE, "kqueue: Error %d on fd %d, socket %p", errcode, + s_fd(sock), sock)); + event_generate(ET_ERROR, sock, errcode); + gen_ref_dec(sock); /* careful not to leak reference counts */ + continue; + } + } + + switch (s_state(sock)) { + case SS_CONNECTING: + if (evt->filter == EVFILT_WRITE) { /* connection completed */ + Debug((DEBUG_ENGINE, "kqueue: Connection completed")); + event_generate(ET_CONNECT, sock, 0); + } + break; + + case SS_LISTENING: + if (evt->filter == EVFILT_READ) { /* connect. to be accept. */ + Debug((DEBUG_ENGINE, "kqueue: Ready for accept")); + event_generate(ET_ACCEPT, sock, 0); + } + break; + + case SS_NOTSOCK: /* doing nothing socket-specific */ + case SS_CONNECTED: + if (evt->filter == EVFILT_READ) { /* data on socket */ + Debug((DEBUG_ENGINE, "kqueue: EOF or data to be read")); + event_generate(evt->flags & EV_EOF ? ET_EOF : ET_READ, sock, 0); + } + if (evt->filter == EVFILT_WRITE) { /* socket writable */ + Debug((DEBUG_ENGINE, "kqueue: Data can be written")); + event_generate(ET_WRITE, sock, 0); + } + break; + + case SS_DATAGRAM: case SS_CONNECTDG: + if (evt->filter == EVFILT_READ) { /* socket readable */ + Debug((DEBUG_ENGINE, "kqueue: Datagram to be read")); + event_generate(ET_READ, sock, 0); + } + if (evt->filter == EVFILT_WRITE) { /* socket writable */ + Debug((DEBUG_ENGINE, "kqueue: Datagram can be written")); + event_generate(ET_WRITE, sock, 0); + } + break; + } + + gen_ref_dec(sock); /* we're done with it */ + } + + timer_run(); /* execute any pending timers */ + } +} + +/** Descriptor for kqueue() event engine. */ +struct Engine engine_kqueue = { + "kqueue()", /* Engine name */ + engine_init, /* Engine initialization function */ + engine_signal, /* Engine signal registration function */ + engine_add, /* Engine socket registration function */ + engine_state, /* Engine socket state change function */ + engine_events, /* Engine socket events mask function */ + engine_delete, /* Engine socket deletion function */ + engine_loop /* Core engine event loop */ +};