2007-04-08 14:39:58 +00:00
|
|
|
/*
|
|
|
|
* FD polling functions for generic select()
|
|
|
|
*
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 15:58:45 +00:00
|
|
|
* Copyright 2000-2014 Willy Tarreau <w@1wt.eu>
|
2007-04-08 14:39:58 +00:00
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version
|
|
|
|
* 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <unistd.h>
|
|
|
|
#include <sys/time.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
|
|
|
|
#include <common/compat.h>
|
|
|
|
#include <common/config.h>
|
2018-08-02 08:16:17 +00:00
|
|
|
#include <common/hathreads.h>
|
2008-07-06 22:09:58 +00:00
|
|
|
#include <common/ticks.h>
|
2007-04-08 14:39:58 +00:00
|
|
|
#include <common/time.h>
|
|
|
|
|
|
|
|
#include <types/global.h>
|
|
|
|
|
|
|
|
#include <proto/fd.h>
|
|
|
|
|
|
|
|
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
/* private data */
|
2018-01-26 20:48:23 +00:00
|
|
|
static int maxfd; /* # of the highest fd + 1 */
|
2018-01-25 15:48:46 +00:00
|
|
|
static unsigned int *fd_evts[2];
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
static THREAD_LOCAL fd_set *tmp_evts[2];
|
2007-04-08 14:39:58 +00:00
|
|
|
|
2012-11-11 15:53:50 +00:00
|
|
|
/* Immediately remove the entry upon close() */
|
|
|
|
REGPRM1 static void __fd_clo(int fd)
|
2007-04-08 14:39:58 +00:00
|
|
|
{
|
2018-01-25 15:48:46 +00:00
|
|
|
hap_fd_clr(fd, fd_evts[DIR_RD]);
|
|
|
|
hap_fd_clr(fd, fd_evts[DIR_WR]);
|
2007-04-08 14:39:58 +00:00
|
|
|
}
|
|
|
|
|
2018-04-25 14:58:25 +00:00
|
|
|
static void _update_fd(int fd, int *max_add_fd)
|
|
|
|
{
|
|
|
|
int en;
|
|
|
|
|
|
|
|
en = fdtab[fd].state;
|
|
|
|
|
|
|
|
/* we have a single state for all threads, which is why we
|
|
|
|
* don't check the tid_bit. First thread to see the update
|
|
|
|
* takes it for every other one.
|
|
|
|
*/
|
|
|
|
if (!(en & FD_EV_POLLED_RW)) {
|
2018-04-26 12:23:07 +00:00
|
|
|
if (!polled_mask[fd]) {
|
2018-04-25 14:58:25 +00:00
|
|
|
/* fd was not watched, it's still not */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* fd totally removed from poll list */
|
|
|
|
hap_fd_clr(fd, fd_evts[DIR_RD]);
|
|
|
|
hap_fd_clr(fd, fd_evts[DIR_WR]);
|
2018-04-26 12:23:07 +00:00
|
|
|
HA_ATOMIC_AND(&polled_mask[fd], 0);
|
2018-04-25 14:58:25 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
/* OK fd has to be monitored, it was either added or changed */
|
|
|
|
if (!(en & FD_EV_POLLED_R))
|
|
|
|
hap_fd_clr(fd, fd_evts[DIR_RD]);
|
|
|
|
else
|
|
|
|
hap_fd_set(fd, fd_evts[DIR_RD]);
|
|
|
|
|
|
|
|
if (!(en & FD_EV_POLLED_W))
|
|
|
|
hap_fd_clr(fd, fd_evts[DIR_WR]);
|
|
|
|
else
|
|
|
|
hap_fd_set(fd, fd_evts[DIR_WR]);
|
|
|
|
|
2018-04-26 12:23:07 +00:00
|
|
|
HA_ATOMIC_OR(&polled_mask[fd], tid_bit);
|
2018-04-25 14:58:25 +00:00
|
|
|
if (fd > *max_add_fd)
|
|
|
|
*max_add_fd = fd;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2007-04-08 14:39:58 +00:00
|
|
|
/*
|
|
|
|
* Select() poller
|
|
|
|
*/
|
2008-07-06 22:09:58 +00:00
|
|
|
REGPRM2 static void _do_poll(struct poller *p, int exp)
|
2007-04-08 14:39:58 +00:00
|
|
|
{
|
|
|
|
int status;
|
|
|
|
int fd, i;
|
|
|
|
struct timeval delta;
|
2008-06-23 12:00:57 +00:00
|
|
|
int delta_ms;
|
2007-04-08 14:39:58 +00:00
|
|
|
int fds;
|
2018-04-25 14:58:25 +00:00
|
|
|
int updt_idx;
|
2007-04-08 14:39:58 +00:00
|
|
|
char count;
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
int readnotnull, writenotnull;
|
2018-01-26 20:48:23 +00:00
|
|
|
int old_maxfd, new_maxfd, max_add_fd;
|
2018-04-25 14:58:25 +00:00
|
|
|
int old_fd;
|
2018-01-26 20:48:23 +00:00
|
|
|
|
|
|
|
max_add_fd = -1;
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
|
2012-11-11 15:53:50 +00:00
|
|
|
/* first, scan the update list to find changes */
|
|
|
|
for (updt_idx = 0; updt_idx < fd_nbupdt; updt_idx++) {
|
|
|
|
fd = fd_updt[updt_idx];
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 15:58:45 +00:00
|
|
|
|
2018-04-03 17:06:18 +00:00
|
|
|
HA_ATOMIC_AND(&fdtab[fd].update_mask, ~tid_bit);
|
2018-01-20 18:30:13 +00:00
|
|
|
if (!fdtab[fd].owner) {
|
|
|
|
activity[tid].poll_drop++;
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 15:58:45 +00:00
|
|
|
continue;
|
2018-01-20 18:30:13 +00:00
|
|
|
}
|
2018-04-25 14:58:25 +00:00
|
|
|
_update_fd(fd, &max_add_fd);
|
|
|
|
}
|
|
|
|
/* Now scan the global update list */
|
|
|
|
for (old_fd = fd = update_list.first; fd != -1; fd = fdtab[fd].update.next) {
|
|
|
|
if (fd == -2) {
|
|
|
|
fd = old_fd;
|
|
|
|
continue;
|
MAJOR: polling: rework the whole polling system
This commit heavily changes the polling system in order to definitely
fix the frequent breakage of SSL which needs to remember the last
EAGAIN before deciding whether to poll or not. Now we have a state per
direction for each FD, as opposed to a previous and current state
previously. An FD can have up to 8 different states for each direction,
each of which being the result of a 3-bit combination. These 3 bits
indicate a wish to access the FD, the readiness of the FD and the
subscription of the FD to the polling system.
This means that it will now be possible to remember the state of a
file descriptor across disable/enable sequences that generally happen
during forwarding, where enabling reading on a previously disabled FD
would result in forgetting the EAGAIN flag it met last time.
Several new state manipulation functions have been introduced or
adapted :
- fd_want_{recv,send} : enable receiving/sending on the FD regardless
of its state (sets the ACTIVE flag) ;
- fd_stop_{recv,send} : stop receiving/sending on the FD regardless
of its state (clears the ACTIVE flag) ;
- fd_cant_{recv,send} : report a failure to receive/send on the FD
corresponding to EAGAIN (clears the READY flag) ;
- fd_may_{recv,send} : report the ability to receive/send on the FD
as reported by poll() (sets the READY flag) ;
Some functions are used to report the current FD status :
- fd_{recv,send}_active
- fd_{recv,send}_ready
- fd_{recv,send}_polled
Some functions were removed :
- fd_ev_clr(), fd_ev_set(), fd_ev_rem(), fd_ev_wai()
The POLLHUP/POLLERR flags are now reported as ready so that the I/O layers
knows it can try to access the file descriptor to get this information.
In order to simplify the conditions to add/remove cache entries, a new
function fd_alloc_or_release_cache_entry() was created to be used from
pollers while scanning for updates.
The following pollers have been updated :
ev_select() : done, built, tested on Linux 3.10
ev_poll() : done, built, tested on Linux 3.10
ev_epoll() : done, built, tested on Linux 3.10 & 3.13
ev_kqueue() : done, built, tested on OpenBSD 5.2
2014-01-10 15:58:45 +00:00
|
|
|
}
|
2018-04-25 14:58:25 +00:00
|
|
|
else if (fd <= -3)
|
|
|
|
fd = -fd -4;
|
|
|
|
if (fd == -1)
|
|
|
|
break;
|
|
|
|
if (fdtab[fd].update_mask & tid_bit) {
|
|
|
|
/* Cheat a bit, as the state is global to all pollers
|
|
|
|
* we don't need every thread ot take care of the
|
|
|
|
* update.
|
|
|
|
*/
|
|
|
|
HA_ATOMIC_AND(&fdtab[fd].update_mask, ~all_threads_mask);
|
|
|
|
done_update_polling(fd);
|
|
|
|
} else
|
|
|
|
continue;
|
|
|
|
if (!fdtab[fd].owner)
|
|
|
|
continue;
|
|
|
|
_update_fd(fd, &max_add_fd);
|
2012-11-11 15:53:50 +00:00
|
|
|
}
|
2018-01-26 20:48:23 +00:00
|
|
|
|
2018-04-25 14:58:25 +00:00
|
|
|
|
2018-01-26 20:48:23 +00:00
|
|
|
/* maybe we added at least one fd larger than maxfd */
|
|
|
|
for (old_maxfd = maxfd; old_maxfd <= max_add_fd; ) {
|
|
|
|
if (HA_ATOMIC_CAS(&maxfd, &old_maxfd, max_add_fd + 1))
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* maxfd doesn't need to be precise but it needs to cover *all* active
|
|
|
|
* FDs. Thus we only shrink it if we have such an opportunity. The algo
|
|
|
|
* is simple : look for the previous used place, try to update maxfd to
|
|
|
|
* point to it, abort if maxfd changed in the mean time.
|
|
|
|
*/
|
|
|
|
old_maxfd = maxfd;
|
|
|
|
do {
|
|
|
|
new_maxfd = old_maxfd;
|
|
|
|
while (new_maxfd - 1 >= 0 && !fdtab[new_maxfd - 1].owner)
|
|
|
|
new_maxfd--;
|
|
|
|
if (new_maxfd >= old_maxfd)
|
|
|
|
break;
|
|
|
|
} while (!HA_ATOMIC_CAS(&maxfd, &old_maxfd, new_maxfd));
|
|
|
|
|
2018-08-02 08:16:17 +00:00
|
|
|
thread_harmless_now();
|
|
|
|
|
2012-11-11 15:53:50 +00:00
|
|
|
fd_nbupdt = 0;
|
|
|
|
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
/* let's restore fdset state */
|
|
|
|
readnotnull = 0; writenotnull = 0;
|
|
|
|
for (i = 0; i < (maxfd + FD_SETSIZE - 1)/(8*sizeof(int)); i++) {
|
|
|
|
readnotnull |= (*(((int*)tmp_evts[DIR_RD])+i) = *(((int*)fd_evts[DIR_RD])+i)) != 0;
|
|
|
|
writenotnull |= (*(((int*)tmp_evts[DIR_WR])+i) = *(((int*)fd_evts[DIR_WR])+i)) != 0;
|
|
|
|
}
|
|
|
|
|
2008-07-06 22:09:58 +00:00
|
|
|
delta_ms = 0;
|
|
|
|
delta.tv_sec = 0;
|
|
|
|
delta.tv_usec = 0;
|
|
|
|
|
2015-04-13 18:44:19 +00:00
|
|
|
if (!exp) {
|
|
|
|
delta_ms = MAX_DELAY_MS;
|
|
|
|
delta.tv_sec = (MAX_DELAY_MS / 1000);
|
|
|
|
delta.tv_usec = (MAX_DELAY_MS % 1000) * 1000;
|
|
|
|
}
|
|
|
|
else if (!tick_is_expired(exp, now_ms)) {
|
|
|
|
delta_ms = TICKS_TO_MS(tick_remain(now_ms, exp)) + SCHEDULER_RESOLUTION;
|
|
|
|
if (delta_ms > MAX_DELAY_MS)
|
|
|
|
delta_ms = MAX_DELAY_MS;
|
|
|
|
delta.tv_sec = (delta_ms / 1000);
|
|
|
|
delta.tv_usec = (delta_ms % 1000) * 1000;
|
2007-04-08 14:39:58 +00:00
|
|
|
}
|
2018-01-20 18:30:13 +00:00
|
|
|
else
|
|
|
|
activity[tid].poll_exp++;
|
2007-04-08 14:39:58 +00:00
|
|
|
|
2011-09-10 14:56:42 +00:00
|
|
|
gettimeofday(&before_poll, NULL);
|
2007-04-08 14:39:58 +00:00
|
|
|
status = select(maxfd,
|
2007-04-08 15:42:27 +00:00
|
|
|
readnotnull ? tmp_evts[DIR_RD] : NULL,
|
|
|
|
writenotnull ? tmp_evts[DIR_WR] : NULL,
|
2007-04-08 14:39:58 +00:00
|
|
|
NULL,
|
2008-06-23 12:00:57 +00:00
|
|
|
&delta);
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
|
2008-06-23 12:00:57 +00:00
|
|
|
tv_update_date(delta_ms, status);
|
2011-09-10 14:56:42 +00:00
|
|
|
measure_idle();
|
2007-04-08 14:39:58 +00:00
|
|
|
|
2018-08-02 08:16:17 +00:00
|
|
|
thread_harmless_end();
|
|
|
|
|
2007-04-08 14:39:58 +00:00
|
|
|
if (status <= 0)
|
|
|
|
return;
|
|
|
|
|
2008-07-14 22:36:31 +00:00
|
|
|
for (fds = 0; (fds * BITS_PER_INT) < maxfd; fds++) {
|
2007-04-08 15:42:27 +00:00
|
|
|
if ((((int *)(tmp_evts[DIR_RD]))[fds] | ((int *)(tmp_evts[DIR_WR]))[fds]) == 0)
|
2007-04-08 14:39:58 +00:00
|
|
|
continue;
|
|
|
|
|
2008-07-14 22:36:31 +00:00
|
|
|
for (count = BITS_PER_INT, fd = fds * BITS_PER_INT; count && fd < maxfd; count--, fd++) {
|
2017-08-30 08:34:36 +00:00
|
|
|
unsigned int n = 0;
|
|
|
|
|
2018-01-20 18:30:13 +00:00
|
|
|
if (!fdtab[fd].owner) {
|
|
|
|
activity[tid].poll_dead++;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!(fdtab[fd].thread_mask & tid_bit)) {
|
|
|
|
activity[tid].poll_skip++;
|
2012-07-06 14:02:29 +00:00
|
|
|
continue;
|
2018-01-20 18:30:13 +00:00
|
|
|
}
|
2012-07-06 14:02:29 +00:00
|
|
|
|
|
|
|
if (FD_ISSET(fd, tmp_evts[DIR_RD]))
|
2017-08-30 08:34:36 +00:00
|
|
|
n |= FD_POLL_IN;
|
2007-04-08 14:39:58 +00:00
|
|
|
|
2012-07-06 14:02:29 +00:00
|
|
|
if (FD_ISSET(fd, tmp_evts[DIR_WR]))
|
2017-08-30 08:34:36 +00:00
|
|
|
n |= FD_POLL_OUT;
|
MAJOR: polling: centralize calls to I/O callbacks
In order for HTTP/2 not to eat too much memory, we'll have to support
on-the-fly buffer allocation, since most streams will have an empty
request buffer at some point. Supporting allocation on the fly means
being able to sleep inside I/O callbacks if a buffer is not available.
Till now, the I/O callbacks were called from two locations :
- when processing the cached events
- when processing the polled events from the poller
This change cleans up the design a bit further than what was started in
1.5. It now ensures that we never call any iocb from the poller itself
and that instead, events learned by the poller are put into the cache.
The benefit is important in terms of stability : we don't have to care
anymore about the risk that new events are added into the poller while
processing its events, and we're certain that updates are processed at
a single location.
To achieve this, we now modify all the fd_* functions so that instead of
creating updates, they add/remove the fd to/from the cache depending on
its state, and only create an update when the polling status reaches a
state where it will have to change. Since the pollers make use of these
functions to notify readiness (using fd_may_recv/fd_may_send), the cache
is always up to date with the poller.
Creating updates only when the polling status needs to change saves a
significant amount of work for the pollers : a benchmark showed that on
a typical TCP proxy test, the amount of updates per connection dropped
from 11 to 1 on average. This also means that the update list is smaller
and has more chances of not thrashing too many CPU cache lines. The first
observed benefit is a net 2% performance gain on the connection rate.
A second benefit is that when a connection is accepted, it's only when
we're processing the cache, and the recv event is automatically added
into the cache *after* the current one, resulting in this event to be
processed immediately during the same loop. Previously we used to have
a second run over the updates to detect if new events were added to
catch them before waking up tasks.
The next gain will be offered by the next steps on this subject consisting
in implementing an I/O queue containing all cached events ordered by priority
just like the run queue, and to be able to leave some events pending there
as long as needed. That will allow us *not* to perform some FD processing
if it's not the proper time for this (typically keep waiting for a buffer
to be allocated if none is available for an recv()). And by only processing
a small bunch of them, we'll allow priorities to take place even at the I/O
level.
As a result of this change, functions fd_alloc_or_release_cache_entry()
and fd_process_polled_events() have disappeared, and the code dedicated
to checking for new fd events after the callback during the poll() loop
was removed as well. Despite the patch looking large, it's mostly a
change of what function is falled upon fd_*() and almost nothing was
added.
2014-11-19 18:43:05 +00:00
|
|
|
|
2017-08-30 08:34:36 +00:00
|
|
|
fd_update_events(fd, n);
|
2007-04-08 14:39:58 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
static int init_select_per_thread()
|
|
|
|
{
|
|
|
|
int fd_set_bytes;
|
|
|
|
|
|
|
|
fd_set_bytes = sizeof(fd_set) * (global.maxsock + FD_SETSIZE - 1) / FD_SETSIZE;
|
|
|
|
if ((tmp_evts[DIR_RD] = (fd_set *)calloc(1, fd_set_bytes)) == NULL)
|
|
|
|
goto fail;
|
|
|
|
if ((tmp_evts[DIR_WR] = (fd_set *)calloc(1, fd_set_bytes)) == NULL)
|
|
|
|
goto fail;
|
|
|
|
return 1;
|
|
|
|
fail:
|
|
|
|
free(tmp_evts[DIR_RD]);
|
|
|
|
free(tmp_evts[DIR_WR]);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void deinit_select_per_thread()
|
|
|
|
{
|
2017-10-27 11:53:47 +00:00
|
|
|
free(tmp_evts[DIR_WR]); tmp_evts[DIR_WR] = NULL;
|
|
|
|
free(tmp_evts[DIR_RD]); tmp_evts[DIR_RD] = NULL;
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
}
|
|
|
|
|
2007-04-09 07:23:31 +00:00
|
|
|
/*
|
|
|
|
* Initialization of the select() poller.
|
|
|
|
* Returns 0 in case of failure, non-zero in case of success. If it fails, it
|
|
|
|
* disables the poller by setting its pref to 0.
|
|
|
|
*/
|
2007-04-15 22:25:25 +00:00
|
|
|
REGPRM1 static int _do_init(struct poller *p)
|
2007-04-09 07:23:31 +00:00
|
|
|
{
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
__label__ fail_swevt, fail_srevt, fail_revt;
|
2007-04-09 07:23:31 +00:00
|
|
|
int fd_set_bytes;
|
|
|
|
|
|
|
|
p->private = NULL;
|
2013-03-31 12:41:15 +00:00
|
|
|
|
|
|
|
if (global.maxsock > FD_SETSIZE)
|
|
|
|
goto fail_revt;
|
|
|
|
|
2007-04-09 07:23:31 +00:00
|
|
|
fd_set_bytes = sizeof(fd_set) * (global.maxsock + FD_SETSIZE - 1) / FD_SETSIZE;
|
|
|
|
|
2018-01-25 15:48:46 +00:00
|
|
|
if ((fd_evts[DIR_RD] = calloc(1, fd_set_bytes)) == NULL)
|
2007-04-09 07:23:31 +00:00
|
|
|
goto fail_srevt;
|
2018-01-25 15:48:46 +00:00
|
|
|
if ((fd_evts[DIR_WR] = calloc(1, fd_set_bytes)) == NULL)
|
2007-04-09 07:23:31 +00:00
|
|
|
goto fail_swevt;
|
|
|
|
|
2017-10-27 11:53:47 +00:00
|
|
|
hap_register_per_thread_init(init_select_per_thread);
|
|
|
|
hap_register_per_thread_deinit(deinit_select_per_thread);
|
|
|
|
|
2007-04-09 07:23:31 +00:00
|
|
|
return 1;
|
|
|
|
|
|
|
|
fail_swevt:
|
|
|
|
free(fd_evts[DIR_RD]);
|
|
|
|
fail_srevt:
|
|
|
|
free(tmp_evts[DIR_WR]);
|
|
|
|
free(tmp_evts[DIR_RD]);
|
|
|
|
fail_revt:
|
|
|
|
p->pref = 0;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Termination of the select() poller.
|
|
|
|
* Memory is released and the poller is marked as unselectable.
|
|
|
|
*/
|
2007-04-15 22:25:25 +00:00
|
|
|
REGPRM1 static void _do_term(struct poller *p)
|
2007-04-09 07:23:31 +00:00
|
|
|
{
|
2008-08-03 10:19:50 +00:00
|
|
|
free(fd_evts[DIR_WR]);
|
|
|
|
free(fd_evts[DIR_RD]);
|
2007-04-09 07:23:31 +00:00
|
|
|
p->private = NULL;
|
|
|
|
p->pref = 0;
|
|
|
|
}
|
|
|
|
|
2007-04-09 17:29:56 +00:00
|
|
|
/*
|
|
|
|
* Check that the poller works.
|
|
|
|
* Returns 1 if OK, otherwise 0.
|
|
|
|
*/
|
2007-04-15 22:25:25 +00:00
|
|
|
REGPRM1 static int _do_test(struct poller *p)
|
2007-04-09 17:29:56 +00:00
|
|
|
{
|
2013-03-31 12:41:15 +00:00
|
|
|
if (global.maxsock > FD_SETSIZE)
|
|
|
|
return 0;
|
|
|
|
|
2007-04-09 17:29:56 +00:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2007-04-08 14:39:58 +00:00
|
|
|
/*
|
2007-04-15 22:25:25 +00:00
|
|
|
* It is a constructor, which means that it will automatically be called before
|
|
|
|
* main(). This is GCC-specific but it works at least since 2.95.
|
|
|
|
* Special care must be taken so that it does not need any uninitialized data.
|
2007-04-08 14:39:58 +00:00
|
|
|
*/
|
2007-04-15 22:25:25 +00:00
|
|
|
__attribute__((constructor))
|
|
|
|
static void _do_register(void)
|
2007-04-08 14:39:58 +00:00
|
|
|
{
|
2007-04-15 22:25:25 +00:00
|
|
|
struct poller *p;
|
|
|
|
|
|
|
|
if (nbpollers >= MAX_POLLERS)
|
|
|
|
return;
|
|
|
|
p = &pollers[nbpollers++];
|
|
|
|
|
2007-04-08 14:39:58 +00:00
|
|
|
p->name = "select";
|
|
|
|
p->pref = 150;
|
2017-03-13 10:38:28 +00:00
|
|
|
p->flags = 0;
|
2007-04-08 14:39:58 +00:00
|
|
|
p->private = NULL;
|
|
|
|
|
2012-11-11 20:02:34 +00:00
|
|
|
p->clo = __fd_clo;
|
2007-04-15 22:25:25 +00:00
|
|
|
p->test = _do_test;
|
|
|
|
p->init = _do_init;
|
|
|
|
p->term = _do_term;
|
|
|
|
p->poll = _do_poll;
|
2007-04-08 14:39:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Local variables:
|
|
|
|
* c-indent-level: 8
|
|
|
|
* c-basic-offset: 8
|
|
|
|
* End:
|
|
|
|
*/
|