2017-10-12 14:09:09 +00:00
|
|
|
/*
|
|
|
|
* include/common/hathreads.h
|
|
|
|
* definitions, macros and inline functions about threads.
|
|
|
|
*
|
|
|
|
* Copyright (C) 2017 Christopher Faulet - cfaulet@haproxy.com
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation, version 2.1
|
|
|
|
* exclusively.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _COMMON_HATHREADS_H
|
|
|
|
#define _COMMON_HATHREADS_H
|
|
|
|
|
|
|
|
#include <common/config.h>
|
|
|
|
|
|
|
|
#define MAX_THREADS_MASK ((unsigned long)-1)
|
|
|
|
extern THREAD_LOCAL unsigned int tid; /* The thread id */
|
2017-11-14 09:16:04 +00:00
|
|
|
extern THREAD_LOCAL unsigned long tid_bit; /* The bit corresponding to the thread id */
|
2017-10-12 14:09:09 +00:00
|
|
|
|
|
|
|
#ifndef USE_THREAD
|
|
|
|
|
2018-01-20 17:19:22 +00:00
|
|
|
/* Built without USE_THREAD: a single thread exists. */
#define MAX_THREADS 1

/* Thread-only declarations are dropped from non-threaded builds. */
#define __decl_hathreads(decl)

/* Non-threaded stand-ins for the atomic operations: plain memory accesses
 * offering the same interface as the threaded versions. Every macro argument
 * is parenthesized and pointer arguments are evaluated exactly once, so that
 * expressions such as "array + 1" or "ptr++" behave as expected. Temporaries
 * use macro-specific names to avoid capturing the caller's variables.
 */

/* Compares *<val> with *<old>. If they match, stores <new> into *<val> and
 * evaluates to 1. Otherwise copies *<val> into *<old> and evaluates to 0.
 * <new> is only evaluated when the comparison succeeds.
 */
#define HA_ATOMIC_CAS(val, old, new)					\
	({								\
		__typeof__(*(val)) *__cas_ptr = (val);			\
		__typeof__(*(old)) *__cas_exp = (old);			\
		(*__cas_ptr == *__cas_exp)				\
			? (*__cas_ptr = (new), 1)			\
			: (*__cas_exp = *__cas_ptr, 0);			\
	})

/* Arithmetic / bitwise updates; each one evaluates to the updated value. */
#define HA_ATOMIC_ADD(val, i)     ({ *(val) += (i); })
#define HA_ATOMIC_SUB(val, i)     ({ *(val) -= (i); })
#define HA_ATOMIC_AND(val, flags) ({ *(val) &= (flags); })
#define HA_ATOMIC_OR(val, flags)  ({ *(val) |= (flags); })

/* Stores <new> into *<val> and evaluates to the previous value. */
#define HA_ATOMIC_XCHG(val, new)					\
	({								\
		__typeof__(*(val)) *__xchg_ptr = (val);			\
		__typeof__(*(val)) __xchg_old = *__xchg_ptr;		\
		*__xchg_ptr = (new);					\
		__xchg_old;						\
	})

/* Stores <new> into *<val>. */
#define HA_ATOMIC_STORE(val, new) ({ *(val) = (new); })

/* Raises *<val> to <new> if it is lower; evaluates to the resulting *<val>. */
#define HA_ATOMIC_UPDATE_MAX(val, new)					\
	({								\
		__typeof__(*(val)) *__max_ptr = (val);			\
		__typeof__(*(val)) __max_new = (new);			\
									\
		if (*__max_ptr < __max_new)				\
			*__max_ptr = __max_new;				\
		*__max_ptr;						\
	})

/* Lowers *<val> to <new> if it is higher; evaluates to the resulting *<val>. */
#define HA_ATOMIC_UPDATE_MIN(val, new)					\
	({								\
		__typeof__(*(val)) *__min_ptr = (val);			\
		__typeof__(*(val)) __min_new = (new);			\
									\
		if (*__min_ptr > __min_new)				\
			*__min_ptr = __min_new;				\
		*__min_ptr;						\
	})
|
|
|
|
|
2017-10-31 17:00:20 +00:00
|
|
|
/* Without threads no memory barrier is needed. */
#define HA_BARRIER()        do { } while (0)

/* Without threads the synchronization point operations are empty statements.
 * THREAD_NO_SYNC() always evaluates to 0 and THREAD_NEED_SYNC() to 1.
 */
#define THREAD_SYNC_INIT(m) do { } while (0)
#define THREAD_SYNC_ENABLE() do { } while (0)
#define THREAD_WANT_SYNC()  do { } while (0)
#define THREAD_ENTER_SYNC() do { } while (0)
#define THREAD_EXIT_SYNC()  do { } while (0)
#define THREAD_NO_SYNC()    ({ 0; })
#define THREAD_NEED_SYNC()  ({ 1; })
|
|
|
|
|
2017-11-07 09:42:54 +00:00
|
|
|
/* Without threads there is nothing to lock: lock operations are empty
 * statements and every "try" variant evaluates to 0.
 */
#define HA_SPIN_INIT(l)             do { } while (0)
#define HA_SPIN_DESTROY(l)          do { } while (0)
#define HA_SPIN_LOCK(lbl, l)        do { } while (0)
#define HA_SPIN_TRYLOCK(lbl, l)     ({ 0; })
#define HA_SPIN_UNLOCK(lbl, l)      do { } while (0)

#define HA_RWLOCK_INIT(l)           do { } while (0)
#define HA_RWLOCK_DESTROY(l)        do { } while (0)
#define HA_RWLOCK_WRLOCK(lbl, l)    do { } while (0)
#define HA_RWLOCK_TRYWRLOCK(lbl, l) ({ 0; })
#define HA_RWLOCK_WRUNLOCK(lbl, l)  do { } while (0)
#define HA_RWLOCK_RDLOCK(lbl, l)    do { } while (0)
#define HA_RWLOCK_TRYRDLOCK(lbl, l) ({ 0; })
#define HA_RWLOCK_RDUNLOCK(lbl, l)  do { } while (0)
|
2017-10-12 14:09:09 +00:00
|
|
|
|
|
|
|
#else /* USE_THREAD */
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <pthread.h>
|
|
|
|
#include <import/plock.h>
|
|
|
|
|
2018-01-20 17:19:22 +00:00
|
|
|
/* Threaded build: the thread limit is LONGBITS (defined outside this file). */
#define MAX_THREADS            LONGBITS

/* Thread-only declarations are kept as written in threaded builds. */
#define __decl_hathreads(decl) decl
|
|
|
|
|
2017-10-12 14:09:09 +00:00
|
|
|
/* TODO: thread: For now, we rely on GCC builtins but it could be a good idea to
|
|
|
|
* have a header file regrouping all functions dealing with threads. */
|
2018-01-04 17:49:31 +00:00
|
|
|
|
2018-01-11 14:20:43 +00:00
|
|
|
#if defined(__GNUC__) && (__GNUC__ < 4 || __GNUC__ == 4 && __GNUC_MINOR__ < 7) && !defined(__clang__)
|
2018-01-04 17:49:31 +00:00
|
|
|
/* gcc < 4.7 */
|
|
|
|
|
|
|
|
/* Atomic operations built on the legacy __sync_* builtins. The temporaries
 * declared inside the statement expressions carry macro-specific prefixes:
 * generic names such as __new or __old would capture a caller's variable of
 * the same name (e.g. "typeof((__new)) __new = (__new);" initializes the
 * temporary from itself), which is exactly what HA_ATOMIC_UPDATE_MAX/MIN
 * would trigger when they pass their own locals to HA_ATOMIC_CAS().
 */
#define HA_ATOMIC_ADD(val, i)     __sync_add_and_fetch(val, i)
#define HA_ATOMIC_SUB(val, i)     __sync_sub_and_fetch(val, i)
#define HA_ATOMIC_AND(val, flags) __sync_and_and_fetch(val, flags)
#define HA_ATOMIC_OR(val, flags)  __sync_or_and_fetch(val, flags)

/* the CAS is a bit complicated. The older API doesn't support returning the
 * value and the swap's result at the same time. So here we take what looks
 * like the safest route, consisting in using the boolean version guaranteeing
 * that the operation was performed or not, and we snoop a previous value. If
 * the compare succeeds, we return. If it fails, we return the previous value,
 * but only if it differs from the expected one. If it's the same it's a race
 * thus we try again to avoid confusing a possibly sensitive caller.
 */
#define HA_ATOMIC_CAS(val, old, new)					\
	({								\
		__typeof__((val)) __cas_val = (val);			\
		__typeof__((old)) __cas_oldp = (old);			\
		__typeof__(*(old)) __cas_oldv;				\
		__typeof__((new)) __cas_new = (new);			\
		int __cas_ret;						\
		do {							\
			__cas_oldv = *__cas_val;			\
			__cas_ret = __sync_bool_compare_and_swap(__cas_val, *__cas_oldp, __cas_new); \
		} while (!__cas_ret && *__cas_oldp == __cas_oldv);	\
		if (!__cas_ret)						\
			*__cas_oldp = __cas_oldv;			\
		__cas_ret;						\
	})

/* Swaps *<val> with <new> through a CAS loop; evaluates to the old value. */
#define HA_ATOMIC_XCHG(val, new)					\
	({								\
		__typeof__((val)) __xchg_val = (val);			\
		__typeof__(*(val)) __xchg_old;				\
		__typeof__((new)) __xchg_new = (new);			\
		do { __xchg_old = *__xchg_val;				\
		} while (!__sync_bool_compare_and_swap(__xchg_val, __xchg_old, __xchg_new)); \
		__xchg_old;						\
	})

/* Stores <new> into *<val> through a CAS loop; yields no value. */
#define HA_ATOMIC_STORE(val, new)					\
	({								\
		__typeof__((val)) __store_val = (val);			\
		__typeof__(*(val)) __store_old;				\
		__typeof__((new)) __store_new = (new);			\
		do { __store_old = *__store_val;			\
		} while (!__sync_bool_compare_and_swap(__store_val, __store_old, __store_new)); \
	})
|
|
|
|
#else
|
|
|
|
/* gcc >= 4.7 */
|
2017-10-12 14:09:09 +00:00
|
|
|
/* Atomic operations built on the __atomic_* builtins. The memory order is
 * explicitly __ATOMIC_SEQ_CST: a literal 0 is __ATOMIC_RELAXED, which makes
 * the operation atomic but emits no barrier, so surrounding accesses could be
 * reordered around it. HA_ATOMIC_CAS() uses the strong variant (weak == 0);
 * on failure the value found in *<val> is written back to *<old>.
 */
#define HA_ATOMIC_CAS(val, old, new) __atomic_compare_exchange_n(val, old, new, 0, __ATOMIC_SEQ_CST, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_ADD(val, i)        __atomic_add_fetch(val, i, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_SUB(val, i)        __atomic_sub_fetch(val, i, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_AND(val, flags)    __atomic_and_fetch(val, flags, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_OR(val, flags)     __atomic_or_fetch(val, flags, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_XCHG(val, new)     __atomic_exchange_n(val, new, __ATOMIC_SEQ_CST)
#define HA_ATOMIC_STORE(val, new)    __atomic_store_n(val, new, __ATOMIC_SEQ_CST)
|
2018-01-04 17:49:31 +00:00
|
|
|
#endif
|
|
|
|
|
2017-10-12 14:09:09 +00:00
|
|
|
/* Atomically raises *<val> to <new> if it is lower, retrying the CAS as long
 * as the observed value is still lower than <new>. Evaluates to *<val> as
 * read after the update. <val> is evaluated once, and the temporaries use
 * macro-specific names so that they cannot be captured by the temporaries
 * declared inside HA_ATOMIC_CAS().
 */
#define HA_ATOMIC_UPDATE_MAX(val, new)					\
	({								\
		__typeof__(*(val)) *__max_ptr = (val);			\
		__typeof__(*(val)) __old_max = *__max_ptr;		\
		__typeof__(*(val)) __new_max = (new);			\
									\
		while (__old_max < __new_max &&				\
		       !HA_ATOMIC_CAS(__max_ptr, &__old_max, __new_max)); \
		*__max_ptr;						\
	})

/* Atomically lowers *<val> to <new> if it is higher; same rules as above. */
#define HA_ATOMIC_UPDATE_MIN(val, new)					\
	({								\
		__typeof__(*(val)) *__min_ptr = (val);			\
		__typeof__(*(val)) __old_min = *__min_ptr;		\
		__typeof__(*(val)) __new_min = (new);			\
									\
		while (__old_min > __new_min &&				\
		       !HA_ATOMIC_CAS(__min_ptr, &__old_min, __new_min)); \
		*__min_ptr;						\
	})
|
|
|
|
|
2017-10-31 17:00:20 +00:00
|
|
|
/* Thread synchronization point functions; only declared here, their
 * definitions are not part of this header.
 */
int  thread_sync_init(unsigned long mask);
void thread_sync_enable(void);
void thread_want_sync(void);
void thread_enter_sync(void);
void thread_exit_sync(void);
int  thread_no_sync(void);
int  thread_need_sync(void);

/* Barrier provided by <import/plock.h>. */
#define HA_BARRIER()         pl_barrier()

/* Threaded builds forward the THREAD_* macros to the functions above. */
#define THREAD_SYNC_INIT(m)  thread_sync_init(m)
#define THREAD_SYNC_ENABLE() thread_sync_enable()
#define THREAD_WANT_SYNC()   thread_want_sync()
#define THREAD_ENTER_SYNC()  thread_enter_sync()
#define THREAD_EXIT_SYNC()   thread_exit_sync()
#define THREAD_NO_SYNC()     thread_no_sync()
#define THREAD_NEED_SYNC()   thread_need_sync()
|
|
|
|
|
2017-10-12 14:09:09 +00:00
|
|
|
#if defined(DEBUG_THREAD) || defined(DEBUG_FULL)
|
|
|
|
|
|
|
|
/* Labels identifying the locks tracked by the lock debugging code. Each
 * value is used as an index into lock_stats[]. LOCK_LABELS is not a lock: it
 * is the number of labels and must stay last.
 */
enum lock_label {
	THREAD_SYNC_LOCK = 0,

	/* file descriptors */
	FDCACHE_LOCK, FD_LOCK,

	/* tasks and memory pools */
	TASK_RQ_LOCK, TASK_WQ_LOCK, POOL_LOCK,

	/* listeners, proxies, servers and load balancing */
	LISTENER_LOCK, LISTENER_QUEUE_LOCK, PROXY_LOCK, SERVER_LOCK,
	UPDATED_SERVERS_LOCK, LBPRM_LOCK,

	SIGNALS_LOCK,

	/* stick tables */
	STK_TABLE_LOCK, STK_SESS_LOCK,

	APPLETS_LOCK, PEER_LOCK, BUF_WQ_LOCK, STRMS_LOCK,

	/* SSL */
	SSL_LOCK, SSL_GEN_CERTS_LOCK,

	/* patterns */
	PATREF_LOCK, PATEXP_LOCK, PATLRU_LOCK,

	VARS_LOCK, COMP_POOL_LOCK, LUA_LOCK, NOTIF_LOCK, SPOE_APPLET_LOCK,
	DNS_LOCK, PID_LIST_LOCK, EMAIL_ALERTS_LOCK, PIPES_LOCK, START_LOCK,

	LOCK_LABELS
};
|
|
|
|
struct lock_stat {
|
|
|
|
uint64_t nsec_wait_for_write;
|
|
|
|
uint64_t nsec_wait_for_read;
|
|
|
|
uint64_t num_write_locked;
|
|
|
|
uint64_t num_write_unlocked;
|
|
|
|
uint64_t num_read_locked;
|
|
|
|
uint64_t num_read_unlocked;
|
|
|
|
};
|
|
|
|
|
|
|
|
extern struct lock_stat lock_stats[LOCK_LABELS];
|
|
|
|
|
|
|
|
/* Raw lock primitives used by the debug wrappers, mapped onto the pl_*
 * operations from <import/plock.h>. The lock pointer argument is
 * parenthesized before being dereferenced and the negated "try" results are
 * wrapped in parentheses, so that the macros expand safely whatever
 * expression they are given or embedded in.
 * NOTE(review): the "try" macros negate pl_try_*(), so they are expected to
 * evaluate to 0 when the lock was obtained - confirm against plock.h.
 */
#define __HA_SPINLOCK_T       unsigned long

#define __SPIN_INIT(l)        ({ *(l) = 0; })
#define __SPIN_DESTROY(l)     ({ *(l) = 0; })
#define __SPIN_LOCK(l)        pl_take_s(l)
#define __SPIN_TRYLOCK(l)     (!pl_try_s(l))
#define __SPIN_UNLOCK(l)      pl_drop_s(l)

#define __HA_RWLOCK_T         unsigned long

#define __RWLOCK_INIT(l)      ({ *(l) = 0; })
#define __RWLOCK_DESTROY(l)   ({ *(l) = 0; })
#define __RWLOCK_WRLOCK(l)    pl_take_w(l)
#define __RWLOCK_TRYWRLOCK(l) (!pl_try_w(l))
#define __RWLOCK_WRUNLOCK(l)  pl_drop_w(l)
#define __RWLOCK_RDLOCK(l)    pl_take_r(l)
#define __RWLOCK_TRYRDLOCK(l) (!pl_try_r(l))
#define __RWLOCK_RDUNLOCK(l)  pl_drop_r(l)
|
|
|
|
|
|
|
|
/* Debug flavour of the lock API: every operation goes through an
 * instrumented inline function. Spinlock and write-lock operations also pass
 * the caller's location (__func__, __FILE__, __LINE__).
 */
#define HA_SPINLOCK_T               struct ha_spinlock

#define HA_SPIN_INIT(l)             __spin_init(l)
#define HA_SPIN_DESTROY(l)          __spin_destroy(l)

#define HA_SPIN_LOCK(lbl, l)        __spin_lock(lbl, l, __func__, __FILE__, __LINE__)
#define HA_SPIN_TRYLOCK(lbl, l)     __spin_trylock(lbl, l, __func__, __FILE__, __LINE__)
#define HA_SPIN_UNLOCK(lbl, l)      __spin_unlock(lbl, l, __func__, __FILE__, __LINE__)

#define HA_RWLOCK_T                 struct ha_rwlock

#define HA_RWLOCK_INIT(l)           __ha_rwlock_init(l)
#define HA_RWLOCK_DESTROY(l)        __ha_rwlock_destroy(l)
#define HA_RWLOCK_WRLOCK(lbl, l)    __ha_rwlock_wrlock(lbl, l, __func__, __FILE__, __LINE__)
#define HA_RWLOCK_TRYWRLOCK(lbl, l) __ha_rwlock_trywrlock(lbl, l, __func__, __FILE__, __LINE__)
#define HA_RWLOCK_WRUNLOCK(lbl, l)  __ha_rwlock_wrunlock(lbl, l, __func__, __FILE__, __LINE__)
#define HA_RWLOCK_RDLOCK(lbl, l)    __ha_rwlock_rdlock(lbl, l)
#define HA_RWLOCK_TRYRDLOCK(lbl, l) __ha_rwlock_tryrdlock(lbl, l)
#define HA_RWLOCK_RDUNLOCK(lbl, l)  __ha_rwlock_rdunlock(lbl, l)
|
2017-10-12 14:09:09 +00:00
|
|
|
|
|
|
|
struct ha_spinlock {
|
|
|
|
__HA_SPINLOCK_T lock;
|
|
|
|
struct {
|
|
|
|
unsigned long owner; /* a bit is set to 1 << tid for the lock owner */
|
|
|
|
unsigned long waiters; /* a bit is set to 1 << tid for waiting threads */
|
|
|
|
struct {
|
|
|
|
const char *function;
|
|
|
|
const char *file;
|
|
|
|
int line;
|
|
|
|
} last_location; /* location of the last owner */
|
|
|
|
} info;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ha_rwlock {
|
|
|
|
__HA_RWLOCK_T lock;
|
|
|
|
struct {
|
|
|
|
unsigned long cur_writer; /* a bit is set to 1 << tid for the lock owner */
|
|
|
|
unsigned long wait_writers; /* a bit is set to 1 << tid for waiting writers */
|
|
|
|
unsigned long cur_readers; /* a bit is set to 1 << tid for current readers */
|
|
|
|
unsigned long wait_readers; /* a bit is set to 1 << tid for waiting waiters */
|
|
|
|
struct {
|
|
|
|
const char *function;
|
|
|
|
const char *file;
|
|
|
|
int line;
|
|
|
|
} last_location; /* location of the last write owner */
|
|
|
|
} info;
|
|
|
|
};
|
|
|
|
|
|
|
|
static inline void show_lock_stats()
|
|
|
|
{
|
MAJOR: threads/fd: Make fd stuffs thread-safe
Many changes have been made to do so. First, the fd_updt array, where all
pending FDs for polling are stored, is now a thread-local array. Then 3 locks
have been added to protect, respectively, the fdtab array, the fd_cache array
and poll information. In addition, a lock for each entry in the fdtab array has
been added to protect all accesses to a specific FD or its information.
For pollers, according to the poller, the way to manage the concurrency is
different. There is a poller loop on each thread. So the set of monitored FDs
may need to be protected. epoll and kqueue are thread-safe per-se, so there few
things to do to protect these pollers. This is not possible with select and
poll, so there is no sharing between the threads. The poller on each thread is
independant from others.
Finally, per-thread init/deinit functions are used for each pollers and for FD
part for manage thread-local ressources.
Now, you must be carefull when a FD is created during the HAProxy startup. All
update on the FD state must be made in the threads context and never before
their creation. This is mandatory because fd_updt array is thread-local and
initialized only for threads. Because there is no pollers for the main one, this
array remains uninitialized in this context. For this reason, listeners are now
enabled in run_thread_poll_loop function, just like the worker pipe.
2017-05-29 08:40:41 +00:00
|
|
|
const char *labels[LOCK_LABELS] = {"THREAD_SYNC", "FDTAB", "FDCACHE", "FD", "POLL",
|
2017-05-30 13:34:30 +00:00
|
|
|
"TASK_RQ", "TASK_WQ", "POOL",
|
2017-06-08 12:04:45 +00:00
|
|
|
"LISTENER", "LISTENER_QUEUE", "PROXY", "SERVER",
|
2017-06-19 10:38:55 +00:00
|
|
|
"UPDATED_SERVERS", "LBPRM", "SIGNALS", "STK_TABLE", "STK_SESS",
|
2017-07-03 09:34:05 +00:00
|
|
|
"APPLETS", "PEER", "BUF_WQ", "STREAMS", "SSL", "SSL_GEN_CERTS",
|
2017-07-16 22:14:07 +00:00
|
|
|
"PATREF", "PATEXP", "PATLRU", "VARS", "COMP_POOL", "LUA",
|
2017-11-07 10:19:48 +00:00
|
|
|
"NOTIF", "SPOE_APPLET", "DNS", "PID_LIST", "EMAIL_ALERTS",
|
|
|
|
"PIPES" };
|
2017-10-12 14:09:09 +00:00
|
|
|
int lbl;
|
|
|
|
|
|
|
|
for (lbl = 0; lbl < LOCK_LABELS; lbl++) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"Stats about Lock %s: \n"
|
|
|
|
"\t # write lock : %lu\n"
|
|
|
|
"\t # write unlock: %lu (%ld)\n"
|
|
|
|
"\t # wait time for write : %.3f msec\n"
|
|
|
|
"\t # wait time for write/lock: %.3f nsec\n"
|
|
|
|
"\t # read lock : %lu\n"
|
|
|
|
"\t # read unlock : %lu (%ld)\n"
|
|
|
|
"\t # wait time for read : %.3f msec\n"
|
|
|
|
"\t # wait time for read/lock : %.3f nsec\n",
|
|
|
|
labels[lbl],
|
|
|
|
lock_stats[lbl].num_write_locked,
|
|
|
|
lock_stats[lbl].num_write_unlocked,
|
|
|
|
lock_stats[lbl].num_write_unlocked - lock_stats[lbl].num_write_locked,
|
|
|
|
(double)lock_stats[lbl].nsec_wait_for_write / 1000000.0,
|
|
|
|
lock_stats[lbl].num_write_locked ? ((double)lock_stats[lbl].nsec_wait_for_write / (double)lock_stats[lbl].num_write_locked) : 0,
|
|
|
|
lock_stats[lbl].num_read_locked,
|
|
|
|
lock_stats[lbl].num_read_unlocked,
|
|
|
|
lock_stats[lbl].num_read_unlocked - lock_stats[lbl].num_read_locked,
|
|
|
|
(double)lock_stats[lbl].nsec_wait_for_read / 1000000.0,
|
|
|
|
lock_stats[lbl].num_read_locked ? ((double)lock_stats[lbl].nsec_wait_for_read / (double)lock_stats[lbl].num_read_locked) : 0);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Following functions are used to collect some stats about locks. We wrap
|
|
|
|
* pthread functions to known how much time we wait in a lock. */
|
|
|
|
|
|
|
|
static uint64_t nsec_now(void) {
|
|
|
|
struct timespec ts;
|
|
|
|
|
|
|
|
clock_gettime(CLOCK_MONOTONIC, &ts);
|
|
|
|
return ((uint64_t) ts.tv_sec * 1000000000ULL +
|
|
|
|
(uint64_t) ts.tv_nsec);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_init(struct ha_rwlock *l)
|
|
|
|
{
|
|
|
|
memset(l, 0, sizeof(struct ha_rwlock));
|
|
|
|
__RWLOCK_INIT(&l->lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_destroy(struct ha_rwlock *l)
|
|
|
|
{
|
|
|
|
__RWLOCK_DESTROY(&l->lock);
|
|
|
|
memset(l, 0, sizeof(struct ha_rwlock));
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_wrlock(enum lock_label lbl, struct ha_rwlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
uint64_t start_time;
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_writer & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for write */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_readers & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for read */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
HA_ATOMIC_OR(&l->info.wait_writers, tid_bit);
|
|
|
|
|
|
|
|
start_time = nsec_now();
|
|
|
|
__RWLOCK_WRLOCK(&l->lock);
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].nsec_wait_for_write, (nsec_now() - start_time));
|
|
|
|
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_locked, 1);
|
|
|
|
|
|
|
|
l->info.cur_writer = tid_bit;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
|
|
|
HA_ATOMIC_AND(&l->info.wait_writers, ~tid_bit);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int __ha_rwlock_trywrlock(enum lock_label lbl, struct ha_rwlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
uint64_t start_time;
|
|
|
|
int r;
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_writer & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for write */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_readers & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for read */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* We set waiting writer because trywrlock could wait for readers to quit */
|
|
|
|
HA_ATOMIC_OR(&l->info.wait_writers, tid_bit);
|
|
|
|
|
|
|
|
start_time = nsec_now();
|
|
|
|
r = __RWLOCK_TRYWRLOCK(&l->lock);
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].nsec_wait_for_write, (nsec_now() - start_time));
|
|
|
|
if (unlikely(r)) {
|
|
|
|
HA_ATOMIC_AND(&l->info.wait_writers, ~tid_bit);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_locked, 1);
|
|
|
|
|
|
|
|
l->info.cur_writer = tid_bit;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
|
|
|
HA_ATOMIC_AND(&l->info.wait_writers, ~tid_bit);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_wrunlock(enum lock_label lbl,struct ha_rwlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
if (unlikely(!(l->info.cur_writer & tid_bit))) {
|
|
|
|
/* the thread is not owning the lock for write */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
l->info.cur_writer = 0;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
|
|
|
__RWLOCK_WRUNLOCK(&l->lock);
|
|
|
|
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_unlocked, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_rdlock(enum lock_label lbl,struct ha_rwlock *l)
|
|
|
|
{
|
|
|
|
uint64_t start_time;
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_writer & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for write */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_readers & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for read */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
HA_ATOMIC_OR(&l->info.wait_readers, tid_bit);
|
|
|
|
|
|
|
|
start_time = nsec_now();
|
|
|
|
__RWLOCK_RDLOCK(&l->lock);
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].nsec_wait_for_read, (nsec_now() - start_time));
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_read_locked, 1);
|
|
|
|
|
|
|
|
HA_ATOMIC_OR(&l->info.cur_readers, tid_bit);
|
|
|
|
|
|
|
|
HA_ATOMIC_AND(&l->info.wait_readers, ~tid_bit);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int __ha_rwlock_tryrdlock(enum lock_label lbl,struct ha_rwlock *l)
|
|
|
|
{
|
|
|
|
int r;
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_writer & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for write */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (unlikely(l->info.cur_readers & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock for read */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* try read should never wait */
|
|
|
|
r = __RWLOCK_TRYRDLOCK(&l->lock);
|
|
|
|
if (unlikely(r))
|
|
|
|
return r;
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_read_locked, 1);
|
|
|
|
|
|
|
|
HA_ATOMIC_OR(&l->info.cur_readers, tid_bit);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __ha_rwlock_rdunlock(enum lock_label lbl,struct ha_rwlock *l)
|
|
|
|
{
|
|
|
|
if (unlikely(!(l->info.cur_readers & tid_bit))) {
|
|
|
|
/* the thread is not owning the lock for read */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
HA_ATOMIC_AND(&l->info.cur_readers, ~tid_bit);
|
|
|
|
|
|
|
|
__RWLOCK_RDUNLOCK(&l->lock);
|
|
|
|
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_read_unlocked, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __spin_init(struct ha_spinlock *l)
|
|
|
|
{
|
|
|
|
memset(l, 0, sizeof(struct ha_spinlock));
|
|
|
|
__SPIN_INIT(&l->lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __spin_destroy(struct ha_spinlock *l)
|
|
|
|
{
|
|
|
|
__SPIN_DESTROY(&l->lock);
|
|
|
|
memset(l, 0, sizeof(struct ha_spinlock));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __spin_lock(enum lock_label lbl, struct ha_spinlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
uint64_t start_time;
|
|
|
|
|
|
|
|
if (unlikely(l->info.owner & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
HA_ATOMIC_OR(&l->info.waiters, tid_bit);
|
|
|
|
|
|
|
|
start_time = nsec_now();
|
|
|
|
__SPIN_LOCK(&l->lock);
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].nsec_wait_for_write, (nsec_now() - start_time));
|
|
|
|
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_locked, 1);
|
|
|
|
|
|
|
|
|
|
|
|
l->info.owner = tid_bit;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
|
|
|
HA_ATOMIC_AND(&l->info.waiters, ~tid_bit);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int __spin_trylock(enum lock_label lbl, struct ha_spinlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
int r;
|
|
|
|
|
|
|
|
if (unlikely(l->info.owner & tid_bit)) {
|
|
|
|
/* the thread is already owning the lock */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* try read should never wait */
|
|
|
|
r = __SPIN_TRYLOCK(&l->lock);
|
|
|
|
if (unlikely(r))
|
|
|
|
return r;
|
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_locked, 1);
|
|
|
|
|
|
|
|
l->info.owner = tid_bit;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void __spin_unlock(enum lock_label lbl, struct ha_spinlock *l,
|
|
|
|
const char *func, const char *file, int line)
|
|
|
|
{
|
|
|
|
if (unlikely(!(l->info.owner & tid_bit))) {
|
|
|
|
/* the thread is not owning the lock */
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
|
|
|
l->info.owner = 0;
|
|
|
|
l->info.last_location.function = func;
|
|
|
|
l->info.last_location.file = file;
|
|
|
|
l->info.last_location.line = line;
|
|
|
|
|
2017-11-02 15:26:02 +00:00
|
|
|
__SPIN_UNLOCK(&l->lock);
|
2017-10-12 14:09:09 +00:00
|
|
|
HA_ATOMIC_ADD(&lock_stats[lbl].num_write_unlocked, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
#else /* DEBUG_THREAD */
|
|
|
|
|
|
|
|
/* Non-debug spinlocks: a bare unsigned long handled by the pl_*_s operations
 * from <import/plock.h>; the <lbl> argument is ignored. The lock pointer is
 * parenthesized before being dereferenced and the negated "try" result is
 * wrapped in parentheses so that the macros expand safely in any expression.
 * NOTE(review): HA_SPIN_TRYLOCK() negates pl_try_s(), so it is expected to
 * evaluate to 0 when the lock was obtained - confirm against plock.h.
 */
#define HA_SPINLOCK_T           unsigned long

#define HA_SPIN_INIT(l)         ({ *(l) = 0; })
#define HA_SPIN_DESTROY(l)      ({ *(l) = 0; })
#define HA_SPIN_LOCK(lbl, l)    pl_take_s(l)
#define HA_SPIN_TRYLOCK(lbl, l) (!pl_try_s(l))
#define HA_SPIN_UNLOCK(lbl, l)  pl_drop_s(l)
|
2017-10-12 14:09:09 +00:00
|
|
|
|
|
|
|
/* Non-debug read/write locks: a bare unsigned long handled by the pl_*_w and
 * pl_*_r operations from <import/plock.h>; the <lbl> argument is ignored.
 * The lock pointer is parenthesized before being dereferenced and the
 * negated "try" results are wrapped in parentheses so that the macros expand
 * safely in any expression.
 * NOTE(review): the "try" macros negate pl_try_w()/pl_try_r(), so they are
 * expected to evaluate to 0 when the lock was obtained - confirm against
 * plock.h.
 */
#define HA_RWLOCK_T                 unsigned long

#define HA_RWLOCK_INIT(l)           ({ *(l) = 0; })
#define HA_RWLOCK_DESTROY(l)        ({ *(l) = 0; })
#define HA_RWLOCK_WRLOCK(lbl, l)    pl_take_w(l)
#define HA_RWLOCK_TRYWRLOCK(lbl, l) (!pl_try_w(l))
#define HA_RWLOCK_WRUNLOCK(lbl, l)  pl_drop_w(l)
#define HA_RWLOCK_RDLOCK(lbl, l)    pl_take_r(l)
#define HA_RWLOCK_TRYRDLOCK(lbl, l) (!pl_try_r(l))
#define HA_RWLOCK_RDUNLOCK(lbl, l)  pl_drop_r(l)
|
2017-10-12 14:09:09 +00:00
|
|
|
|
|
|
|
#endif /* DEBUG_THREAD */
|
|
|
|
|
|
|
|
#endif /* USE_THREAD */
|
|
|
|
|
|
|
|
#endif /* _COMMON_HATHREADS_H */
|