2007-04-09 06:03:06 -04:00
|
|
|
/*
|
|
|
|
|
* FD polling functions for FreeBSD kqueue()
|
|
|
|
|
*
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 10:58:45 -05:00
|
|
|
* Copyright 2000-2014 Willy Tarreau <w@1wt.eu>
|
2007-04-09 06:03:06 -04:00
|
|
|
*
|
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
|
* as published by the Free Software Foundation; either version
|
|
|
|
|
* 2 of the License, or (at your option) any later version.
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
#include <unistd.h>
|
|
|
|
|
#include <sys/time.h>
|
|
|
|
|
#include <sys/types.h>
|
|
|
|
|
|
|
|
|
|
#include <sys/event.h>
|
|
|
|
|
#include <sys/time.h>
|
|
|
|
|
|
|
|
|
|
#include <common/compat.h>
|
|
|
|
|
#include <common/config.h>
|
2008-07-06 18:09:58 -04:00
|
|
|
#include <common/ticks.h>
|
2007-04-09 06:03:06 -04:00
|
|
|
#include <common/time.h>
|
2007-06-03 11:16:49 -04:00
|
|
|
#include <common/tools.h>
|
2007-04-09 06:03:06 -04:00
|
|
|
|
|
|
|
|
#include <types/global.h>
|
|
|
|
|
|
|
|
|
|
#include <proto/fd.h>
|
2015-04-13 14:44:19 -04:00
|
|
|
|
2007-04-09 06:03:06 -04:00
|
|
|
|
|
|
|
|
/* private data */
|
|
|
|
|
static int kqueue_fd;
|
|
|
|
|
static struct kevent *kev = NULL;
|
|
|
|
|
|
|
|
|
|
/*
|
2012-11-11 14:49:49 -05:00
|
|
|
* kqueue() poller
|
2007-04-09 06:03:06 -04:00
|
|
|
*/
|
2012-11-11 14:49:49 -05:00
|
|
|
REGPRM2 static void _do_poll(struct poller *p, int exp)
|
2007-04-09 06:03:06 -04:00
|
|
|
{
|
2012-11-11 14:49:49 -05:00
|
|
|
int status;
|
|
|
|
|
int count, fd, delta_ms;
|
|
|
|
|
struct timespec timeout;
|
|
|
|
|
int updt_idx, en, eo;
|
|
|
|
|
int changes = 0;
|
2007-04-09 06:03:06 -04:00
|
|
|
|
2012-11-11 14:49:49 -05:00
|
|
|
/* first, scan the update list to find changes */
|
|
|
|
|
for (updt_idx = 0; updt_idx < fd_nbupdt; updt_idx++) {
|
|
|
|
|
fd = fd_updt[updt_idx];
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 10:58:45 -05:00
|
|
|
fdtab[fd].updated = 0;
|
|
|
|
|
fdtab[fd].new = 0;
|
|
|
|
|
|
|
|
|
|
if (!fdtab[fd].owner)
|
|
|
|
|
continue;
|
|
|
|
|
|
2014-01-25 04:32:56 -05:00
|
|
|
eo = fdtab[fd].state;
|
|
|
|
|
en = fd_compute_new_polled_status(eo);
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 10:58:45 -05:00
|
|
|
|
|
|
|
|
if ((eo ^ en) & FD_EV_POLLED_RW) {
|
|
|
|
|
/* poll status changed */
|
|
|
|
|
fdtab[fd].state = en;
|
2012-11-11 14:49:49 -05:00
|
|
|
|
|
|
|
|
if ((eo ^ en) & FD_EV_POLLED_R) {
|
|
|
|
|
/* read poll status changed */
|
|
|
|
|
if (en & FD_EV_POLLED_R) {
|
|
|
|
|
EV_SET(&kev[changes], fd, EVFILT_READ, EV_ADD, 0, 0, NULL);
|
|
|
|
|
changes++;
|
|
|
|
|
}
|
|
|
|
|
else {
|
|
|
|
|
EV_SET(&kev[changes], fd, EVFILT_READ, EV_DELETE, 0, 0, NULL);
|
|
|
|
|
changes++;
|
|
|
|
|
}
|
|
|
|
|
}
|
2007-04-09 06:03:06 -04:00
|
|
|
|
2012-11-11 14:49:49 -05:00
|
|
|
if ((eo ^ en) & FD_EV_POLLED_W) {
|
|
|
|
|
/* write poll status changed */
|
|
|
|
|
if (en & FD_EV_POLLED_W) {
|
|
|
|
|
EV_SET(&kev[changes], fd, EVFILT_WRITE, EV_ADD, 0, 0, NULL);
|
|
|
|
|
changes++;
|
|
|
|
|
}
|
|
|
|
|
else {
|
|
|
|
|
EV_SET(&kev[changes], fd, EVFILT_WRITE, EV_DELETE, 0, 0, NULL);
|
|
|
|
|
changes++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2007-04-09 06:03:06 -04:00
|
|
|
if (changes)
|
|
|
|
|
kevent(kqueue_fd, kev, changes, NULL, 0, NULL);
|
2012-11-11 14:49:49 -05:00
|
|
|
fd_nbupdt = 0;
|
2007-04-09 06:03:06 -04:00
|
|
|
|
2008-07-06 18:09:58 -04:00
|
|
|
delta_ms = 0;
|
|
|
|
|
timeout.tv_sec = 0;
|
|
|
|
|
timeout.tv_nsec = 0;
|
|
|
|
|
|
2015-04-13 14:44:19 -04:00
|
|
|
if (!exp) {
|
|
|
|
|
delta_ms = MAX_DELAY_MS;
|
|
|
|
|
timeout.tv_sec = (MAX_DELAY_MS / 1000);
|
|
|
|
|
timeout.tv_nsec = (MAX_DELAY_MS % 1000) * 1000000;
|
|
|
|
|
}
|
|
|
|
|
else if (!tick_is_expired(exp, now_ms)) {
|
|
|
|
|
delta_ms = TICKS_TO_MS(tick_remain(now_ms, exp)) + 1;
|
|
|
|
|
if (delta_ms > MAX_DELAY_MS)
|
|
|
|
|
delta_ms = MAX_DELAY_MS;
|
|
|
|
|
timeout.tv_sec = (delta_ms / 1000);
|
|
|
|
|
timeout.tv_nsec = (delta_ms % 1000) * 1000000;
|
2007-04-09 10:25:46 -04:00
|
|
|
}
|
2007-04-09 06:03:06 -04:00
|
|
|
|
2007-06-03 11:16:49 -04:00
|
|
|
fd = MIN(maxfd, global.tune.maxpollevents);
|
2011-09-10 10:56:42 -04:00
|
|
|
gettimeofday(&before_poll, NULL);
|
2007-04-09 06:03:06 -04:00
|
|
|
status = kevent(kqueue_fd, // int kq
|
|
|
|
|
NULL, // const struct kevent *changelist
|
|
|
|
|
0, // int nchanges
|
|
|
|
|
kev, // struct kevent *eventlist
|
2007-06-03 11:16:49 -04:00
|
|
|
fd, // int nevents
|
2008-06-23 08:00:57 -04:00
|
|
|
&timeout); // const struct timespec *timeout
|
|
|
|
|
tv_update_date(delta_ms, status);
|
2011-09-10 10:56:42 -04:00
|
|
|
measure_idle();
|
2007-04-09 06:03:06 -04:00
|
|
|
|
|
|
|
|
for (count = 0; count < status; count++) {
|
2017-08-30 04:34:36 -04:00
|
|
|
unsigned int n = 0;
|
2007-04-09 06:03:06 -04:00
|
|
|
fd = kev[count].ident;
|
2012-07-06 05:44:28 -04:00
|
|
|
|
2012-07-06 10:02:29 -04:00
|
|
|
if (!fdtab[fd].owner)
|
|
|
|
|
continue;
|
|
|
|
|
|
2007-04-09 06:03:06 -04:00
|
|
|
if (kev[count].filter == EVFILT_READ) {
|
2017-03-13 15:49:56 -04:00
|
|
|
if (kev[count].data)
|
2017-08-30 04:34:36 -04:00
|
|
|
n |= FD_POLL_IN;
|
2017-03-13 15:36:48 -04:00
|
|
|
if (kev[count].flags & EV_EOF)
|
2017-08-30 04:34:36 -04:00
|
|
|
n |= FD_POLL_HUP;
|
2012-11-11 14:49:49 -05:00
|
|
|
}
|
|
|
|
|
else if (kev[count].filter == EVFILT_WRITE) {
|
2017-08-30 04:34:36 -04:00
|
|
|
n |= FD_POLL_OUT;
|
2017-03-13 15:36:48 -04:00
|
|
|
if (kev[count].flags & EV_EOF)
|
2017-08-30 04:34:36 -04:00
|
|
|
n |= FD_POLL_ERR;
|
2007-04-09 06:03:06 -04:00
|
|
|
}
|
2012-11-11 14:49:49 -05:00
|
|
|
|
2017-08-30 04:34:36 -04:00
|
|
|
fd_update_events(fd, n);
|
2007-04-09 06:03:06 -04:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Initialization of the kqueue() poller.
|
|
|
|
|
* Returns 0 in case of failure, non-zero in case of success. If it fails, it
|
|
|
|
|
* disables the poller by setting its pref to 0.
|
|
|
|
|
*/
|
2007-04-15 18:25:25 -04:00
|
|
|
REGPRM1 static int _do_init(struct poller *p)
|
2007-04-09 06:03:06 -04:00
|
|
|
{
|
|
|
|
|
p->private = NULL;
|
|
|
|
|
|
|
|
|
|
kqueue_fd = kqueue();
|
|
|
|
|
if (kqueue_fd < 0)
|
|
|
|
|
goto fail_fd;
|
|
|
|
|
|
2012-11-11 14:49:49 -05:00
|
|
|
/* we can have up to two events per fd (*/
|
2016-04-03 07:48:42 -04:00
|
|
|
kev = calloc(1, sizeof(struct kevent) * 2 * global.maxsock);
|
2007-04-09 06:03:06 -04:00
|
|
|
if (kev == NULL)
|
|
|
|
|
goto fail_kev;
|
|
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
|
|
fail_kev:
|
|
|
|
|
close(kqueue_fd);
|
2009-05-10 04:18:54 -04:00
|
|
|
kqueue_fd = -1;
|
2007-04-09 06:03:06 -04:00
|
|
|
fail_fd:
|
|
|
|
|
p->pref = 0;
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Termination of the kqueue() poller.
|
|
|
|
|
* Memory is released and the poller is marked as unselectable.
|
|
|
|
|
*/
|
2007-04-15 18:25:25 -04:00
|
|
|
REGPRM1 static void _do_term(struct poller *p)
|
2007-04-09 06:03:06 -04:00
|
|
|
{
|
2008-08-03 06:19:50 -04:00
|
|
|
free(kev);
|
2009-05-10 04:18:54 -04:00
|
|
|
|
|
|
|
|
if (kqueue_fd >= 0) {
|
|
|
|
|
close(kqueue_fd);
|
|
|
|
|
kqueue_fd = -1;
|
|
|
|
|
}
|
2007-04-09 06:03:06 -04:00
|
|
|
|
|
|
|
|
p->private = NULL;
|
|
|
|
|
p->pref = 0;
|
|
|
|
|
}
|
|
|
|
|
|
2007-04-09 13:29:56 -04:00
|
|
|
/*
|
|
|
|
|
* Check that the poller works.
|
|
|
|
|
* Returns 1 if OK, otherwise 0.
|
|
|
|
|
*/
|
2007-04-15 18:25:25 -04:00
|
|
|
REGPRM1 static int _do_test(struct poller *p)
|
2007-04-09 13:29:56 -04:00
|
|
|
{
|
|
|
|
|
int fd;
|
|
|
|
|
|
|
|
|
|
fd = kqueue();
|
|
|
|
|
if (fd < 0)
|
|
|
|
|
return 0;
|
|
|
|
|
close(fd);
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Recreate the kqueue file descriptor after a fork(). Returns 1 if OK,
|
|
|
|
|
* otherwise 0. Note that some pollers need to be reopened after a fork()
|
|
|
|
|
* (such as kqueue), and some others may fail to do so in a chroot.
|
|
|
|
|
*/
|
2007-04-15 18:25:25 -04:00
|
|
|
REGPRM1 static int _do_fork(struct poller *p)
|
2007-04-09 13:29:56 -04:00
|
|
|
{
|
2009-05-10 04:18:54 -04:00
|
|
|
if (kqueue_fd >= 0)
|
|
|
|
|
close(kqueue_fd);
|
2007-04-09 13:29:56 -04:00
|
|
|
kqueue_fd = kqueue();
|
|
|
|
|
if (kqueue_fd < 0)
|
|
|
|
|
return 0;
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
2007-04-09 06:03:06 -04:00
|
|
|
/*
|
2007-04-15 18:25:25 -04:00
|
|
|
* It is a constructor, which means that it will automatically be called before
|
|
|
|
|
* main(). This is GCC-specific but it works at least since 2.95.
|
|
|
|
|
* Special care must be taken so that it does not need any uninitialized data.
|
2007-04-09 06:03:06 -04:00
|
|
|
*/
|
2007-04-15 18:25:25 -04:00
|
|
|
__attribute__((constructor))
|
|
|
|
|
static void _do_register(void)
|
2007-04-09 06:03:06 -04:00
|
|
|
{
|
2007-04-15 18:25:25 -04:00
|
|
|
struct poller *p;
|
|
|
|
|
|
|
|
|
|
if (nbpollers >= MAX_POLLERS)
|
|
|
|
|
return;
|
2009-05-10 04:18:54 -04:00
|
|
|
|
|
|
|
|
kqueue_fd = -1;
|
2007-04-15 18:25:25 -04:00
|
|
|
p = &pollers[nbpollers++];
|
|
|
|
|
|
2007-04-09 06:03:06 -04:00
|
|
|
p->name = "kqueue";
|
|
|
|
|
p->pref = 300;
|
2017-03-13 15:36:48 -04:00
|
|
|
p->flags = HAP_POLL_F_RDHUP;
|
2007-04-09 06:03:06 -04:00
|
|
|
p->private = NULL;
|
|
|
|
|
|
2012-11-11 15:02:34 -05:00
|
|
|
p->clo = NULL;
|
2007-04-15 18:25:25 -04:00
|
|
|
p->test = _do_test;
|
|
|
|
|
p->init = _do_init;
|
|
|
|
|
p->term = _do_term;
|
|
|
|
|
p->poll = _do_poll;
|
|
|
|
|
p->fork = _do_fork;
|
2007-04-09 06:03:06 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Local variables:
|
|
|
|
|
* c-indent-level: 8
|
|
|
|
|
* c-basic-offset: 8
|
|
|
|
|
* End:
|
|
|
|
|
*/
|