mirror of
http://git.haproxy.org/git/haproxy.git/
synced 2025-04-01 22:48:25 +00:00
MINOR: activity: enable automatic profiling turn on/off
Instead of having to manually turn task profiling on/off in the configuration, by default it will work in "auto" mode, which automatically turns on on any thread experiencing sustained loop latencies over one millisecond averaged over the last 1024 samples. This may happen with configs using lots of regex (thing map_reg for example, which is the lazy way to convert Apache's rewrite rules but must not be abused), and such high latencies affect all the process and the problem is most often intermittent (e.g. hitting a map which is only used for certain host names). Thus now by default, with profiling set to "auto", it remains off all the time until something bad happens. This also helps better focus on the issues when looking at the logs as well as in "show sess" output. It automatically turns off when the average loop latency over the last 1024 calls goes below 990 microseconds (which typically takes a while when in idle). This patch could be backported to stable versions after a bit more exposure, as it definitely improves observability and the ability to quickly spot the culprit. In this case, previous patch ("MINOR: activity: make the profiling status per thread and not global") must also be taken.
This commit is contained in:
parent
d9add3acc8
commit
d2d3348acb
@ -1462,11 +1462,22 @@ noreuseport
|
||||
Disables the use of SO_REUSEPORT - see socket(7). It is equivalent to the
|
||||
command line argument "-dR".
|
||||
|
||||
profiling.tasks { on | off }
|
||||
Enables ('on') or disables ('off') per-task CPU profiling. CPU profiling per
|
||||
task can be very convenient to report where the time is spent and which
|
||||
requests have what effect on which other request. It is not enabled by
|
||||
default as it may consume a little bit extra CPU. This requires a system
|
||||
profiling.tasks { auto | on | off }
|
||||
Enables ('on') or disables ('off') per-task CPU profiling. When set to 'auto'
|
||||
the profiling automatically turns on a thread when it starts to suffer from
|
||||
an average latency of 1000 microseconds or higher as reported in the
|
||||
"avg_loop_us" activity field, and automatically turns off when the latency
|
||||
reutnrs below 990 microseconds (this value is an average over the last 1024
|
||||
loops so it does not vary quickly and tends to significantly smooth short
|
||||
spikes). It may also spontaneously trigger from time to time on overloaded
|
||||
systems, containers, or virtual machines, or when the system swaps (which
|
||||
must absolutely never happen on a load balancer).
|
||||
|
||||
CPU profiling per task can be very convenient to report where the time is
|
||||
spent and which requests have what effect on which other request. Enabling
|
||||
it will typically affect the overall's performance by less than 1%, thus it
|
||||
is recommended to leave it to the default 'auto' value so that it only
|
||||
operates when a problem is identified. This feature requires a system
|
||||
supporting the clock_gettime(2) syscall with clock identifiers
|
||||
CLOCK_MONOTONIC and CLOCK_THREAD_CPUTIME_ID, otherwise the reported time will
|
||||
be zero. This option may be changed at run time using "set profiling" on the
|
||||
|
@ -1667,7 +1667,7 @@ set maxconn global <maxconn>
|
||||
delayed until the threshold is reached. A value of zero restores the initial
|
||||
setting.
|
||||
|
||||
set profiling { tasks } { on | off }
|
||||
set profiling { tasks } { auto | on | off }
|
||||
Enables or disables CPU profiling for the indicated subsystem. This is
|
||||
equivalent to setting or clearing the "profiling" settings in the "global"
|
||||
section of the configuration file. Please also see "show profiling".
|
||||
|
@ -29,7 +29,10 @@
|
||||
#include <proto/freq_ctr.h>
|
||||
|
||||
/* bit fields for "profiling" */
|
||||
#define HA_PROF_TASKS 0x00000001 /* enable per-task CPU profiling */
|
||||
#define HA_PROF_TASKS_OFF 0x00000000 /* per-task CPU profiling forced disabled */
|
||||
#define HA_PROF_TASKS_AUTO 0x00000001 /* per-task CPU profiling automatic */
|
||||
#define HA_PROF_TASKS_ON 0x00000002 /* per-task CPU profiling forced enabled */
|
||||
#define HA_PROF_TASKS_MASK 0x00000003 /* per-task CPU profiling mask */
|
||||
|
||||
extern unsigned int profiling;
|
||||
extern unsigned long task_profiling_mask;
|
||||
@ -49,6 +52,13 @@ static inline void activity_count_runtime()
|
||||
uint64_t new_cpu_time;
|
||||
int64_t stolen;
|
||||
uint32_t run_time;
|
||||
uint32_t up, down;
|
||||
|
||||
/* 1 millisecond per loop on average over last 1024 iterations is
|
||||
* enough to turn on profiling.
|
||||
*/
|
||||
up = 1000;
|
||||
down = up * 99 / 100;
|
||||
|
||||
new_cpu_time = now_cpu_time();
|
||||
new_mono_time = now_mono_time();
|
||||
@ -69,12 +79,22 @@ static inline void activity_count_runtime()
|
||||
run_time = (before_poll.tv_sec - after_poll.tv_sec) * 1000000U + (before_poll.tv_usec - after_poll.tv_usec);
|
||||
swrate_add(&activity[tid].avg_loop_us, TIME_STATS_SAMPLES, run_time);
|
||||
|
||||
/* reaching the "up" threshold on average switches profiling to "on"
|
||||
* when automatic, and going back below the "down" threshold switches
|
||||
* to off.
|
||||
*/
|
||||
if (!(task_profiling_mask & tid_bit)) {
|
||||
if (unlikely(profiling & HA_PROF_TASKS))
|
||||
_HA_ATOMIC_OR(&task_profiling_mask, tid_bit);
|
||||
if (unlikely((profiling & HA_PROF_TASKS_MASK) == HA_PROF_TASKS_ON ||
|
||||
((profiling & HA_PROF_TASKS_MASK) == HA_PROF_TASKS_AUTO && run_time >= up))) {
|
||||
if (swrate_avg(activity[tid].avg_loop_us, TIME_STATS_SAMPLES) >= up)
|
||||
_HA_ATOMIC_OR(&task_profiling_mask, tid_bit);
|
||||
}
|
||||
} else {
|
||||
if (unlikely(!(profiling & HA_PROF_TASKS)))
|
||||
_HA_ATOMIC_AND(&task_profiling_mask, ~tid_bit);
|
||||
if (unlikely((profiling & HA_PROF_TASKS_MASK) == HA_PROF_TASKS_OFF ||
|
||||
((profiling & HA_PROF_TASKS_MASK) == HA_PROF_TASKS_AUTO && run_time <= down))) {
|
||||
if (swrate_avg(activity[tid].avg_loop_us, TIME_STATS_SAMPLES) <= down)
|
||||
_HA_ATOMIC_AND(&task_profiling_mask, ~tid_bit);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -23,7 +23,7 @@
|
||||
|
||||
|
||||
/* bit field of profiling options. Beware, may be modified at runtime! */
|
||||
unsigned int profiling = 0;
|
||||
unsigned int profiling = HA_PROF_TASKS_AUTO;
|
||||
unsigned long task_profiling_mask = 0;
|
||||
|
||||
/* One struct per thread containing all collected measurements */
|
||||
@ -49,11 +49,13 @@ static int cfg_parse_prof_tasks(char **args, int section_type, struct proxy *cur
|
||||
return -1;
|
||||
|
||||
if (strcmp(args[1], "on") == 0)
|
||||
profiling |= HA_PROF_TASKS;
|
||||
profiling = (profiling & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_ON;
|
||||
else if (strcmp(args[1], "auto") == 0)
|
||||
profiling = (profiling & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_AUTO;
|
||||
else if (strcmp(args[1], "off") == 0)
|
||||
profiling &= ~HA_PROF_TASKS;
|
||||
profiling = (profiling & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_OFF;
|
||||
else {
|
||||
memprintf(err, "'%s' expects either 'on' or 'off' but got '%s'.", args[0], args[1]);
|
||||
memprintf(err, "'%s' expects either 'on', 'auto', or 'off' but got '%s'.", args[0], args[1]);
|
||||
return -1;
|
||||
}
|
||||
return 0;
|
||||
@ -62,27 +64,34 @@ static int cfg_parse_prof_tasks(char **args, int section_type, struct proxy *cur
|
||||
/* parse a "set profiling" command. It always returns 1. */
|
||||
static int cli_parse_set_profiling(char **args, char *payload, struct appctx *appctx, void *private)
|
||||
{
|
||||
unsigned int bit = 0;
|
||||
|
||||
if (!cli_has_level(appctx, ACCESS_LVL_ADMIN))
|
||||
return 1;
|
||||
|
||||
if (strcmp(args[2], "tasks") == 0)
|
||||
bit = HA_PROF_TASKS;
|
||||
else {
|
||||
if (strcmp(args[2], "tasks") != 0) {
|
||||
appctx->ctx.cli.severity = LOG_ERR;
|
||||
appctx->ctx.cli.msg = "Expects 'tasks'.\n";
|
||||
appctx->st0 = CLI_ST_PRINT;
|
||||
return 1;
|
||||
}
|
||||
|
||||
if (strcmp(args[3], "on") == 0)
|
||||
_HA_ATOMIC_OR(&profiling, bit);
|
||||
else if (strcmp(args[3], "off") == 0)
|
||||
_HA_ATOMIC_AND(&profiling, ~bit);
|
||||
if (strcmp(args[3], "on") == 0) {
|
||||
unsigned int old = profiling;
|
||||
while (!_HA_ATOMIC_CAS(&profiling, &old, (old & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_ON))
|
||||
;
|
||||
}
|
||||
else if (strcmp(args[3], "auto") == 0) {
|
||||
unsigned int old = profiling;
|
||||
while (!_HA_ATOMIC_CAS(&profiling, &old, (old & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_AUTO))
|
||||
;
|
||||
}
|
||||
else if (strcmp(args[3], "off") == 0) {
|
||||
unsigned int old = profiling;
|
||||
while (!_HA_ATOMIC_CAS(&profiling, &old, (old & ~HA_PROF_TASKS_MASK) | HA_PROF_TASKS_OFF))
|
||||
;
|
||||
}
|
||||
else {
|
||||
appctx->ctx.cli.severity = LOG_ERR;
|
||||
appctx->ctx.cli.msg = "Expects either 'on' or 'off'.\n";
|
||||
appctx->ctx.cli.msg = "Expects 'on', 'auto', or 'off'.\n";
|
||||
appctx->st0 = CLI_ST_PRINT;
|
||||
return 1;
|
||||
}
|
||||
@ -95,14 +104,22 @@ static int cli_parse_set_profiling(char **args, char *payload, struct appctx *ap
|
||||
static int cli_io_handler_show_profiling(struct appctx *appctx)
|
||||
{
|
||||
struct stream_interface *si = appctx->owner;
|
||||
const char *str;
|
||||
|
||||
if (unlikely(si_ic(si)->flags & (CF_WRITE_ERROR|CF_SHUTW)))
|
||||
return 1;
|
||||
|
||||
chunk_reset(&trash);
|
||||
|
||||
chunk_printf(&trash, "Per-task CPU profiling : %s # set profiling tasks {on|off}\n",
|
||||
(profiling & HA_PROF_TASKS) ? "on" : "off");
|
||||
switch (profiling & HA_PROF_TASKS_MASK) {
|
||||
case HA_PROF_TASKS_AUTO: str="auto"; break;
|
||||
case HA_PROF_TASKS_ON: str="on"; break;
|
||||
default: str="off"; break;
|
||||
}
|
||||
|
||||
chunk_printf(&trash,
|
||||
"Per-task CPU profiling : %s # set profiling tasks {on|auto|off}\n",
|
||||
str);
|
||||
|
||||
if (ci_putchk(si_ic(si), &trash) == -1) {
|
||||
/* failed, try again */
|
||||
|
@ -3449,7 +3449,7 @@ void http_end_txn_clean_session(struct stream *s)
|
||||
s->task->calls = 0;
|
||||
s->task->cpu_time = 0;
|
||||
s->task->lat_time = 0;
|
||||
s->task->call_date = (profiling & HA_PROF_TASKS) ? now_mono_time() : 0;
|
||||
s->task->call_date = ((profiling & HA_PROF_TASKS_MASK) >= HA_PROF_TASKS_AUTO) ? now_mono_time() : 0;
|
||||
|
||||
s->logs.accept_date = date; /* user-visible date for logging */
|
||||
s->logs.tv_accept = now; /* corrected date for internal use */
|
||||
|
Loading…
Reference in New Issue
Block a user