mirror of
http://git.haproxy.org/git/haproxy.git/
synced 2025-01-25 06:53:03 +00:00
REORG: clock: move the updates of cpu/mono time to clock.c
The entering_poll/leaving_poll/measure_idle functions that were hard to classify and used to move to various locations have now been placed into clock.c since it's precisely about time-keeping. The functions were renamed to clock_*. The samp_time and idle_time values are now static since there is no reason for them to be read from outside.
This commit is contained in:
parent
5554264f31
commit
f9d5e1079c
@ -41,5 +41,8 @@ void clock_update_date(int max_wait, int interrupted);
|
|||||||
void clock_init_process_date(void);
|
void clock_init_process_date(void);
|
||||||
void clock_init_thread_date(void);
|
void clock_init_thread_date(void);
|
||||||
char *timeofday_as_iso_us(int pad);
|
char *timeofday_as_iso_us(int pad);
|
||||||
|
uint clock_report_idle(void);
|
||||||
|
void clock_leaving_poll(int timeout, int interrupted);
|
||||||
|
void clock_entering_poll(void);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
@ -93,9 +93,6 @@ extern volatile unsigned long global_tasks_mask; /* Mask of threads with tasks i
|
|||||||
extern unsigned int grq_total; /* total number of entries in the global run queue, atomic */
|
extern unsigned int grq_total; /* total number of entries in the global run queue, atomic */
|
||||||
extern unsigned int niced_tasks; /* number of niced tasks in the run queue */
|
extern unsigned int niced_tasks; /* number of niced tasks in the run queue */
|
||||||
|
|
||||||
extern THREAD_LOCAL unsigned int samp_time; /* total elapsed time over current sample */
|
|
||||||
extern THREAD_LOCAL unsigned int idle_time; /* total idle time over current sample */
|
|
||||||
|
|
||||||
extern struct pool_head *pool_head_task;
|
extern struct pool_head *pool_head_task;
|
||||||
extern struct pool_head *pool_head_tasklet;
|
extern struct pool_head *pool_head_tasklet;
|
||||||
extern struct pool_head *pool_head_notification;
|
extern struct pool_head *pool_head_notification;
|
||||||
@ -117,10 +114,6 @@ void tasklet_kill(struct tasklet *t);
|
|||||||
void __task_wakeup(struct task *t);
|
void __task_wakeup(struct task *t);
|
||||||
void __task_queue(struct task *task, struct eb_root *wq);
|
void __task_queue(struct task *task, struct eb_root *wq);
|
||||||
|
|
||||||
uint sched_report_idle();
|
|
||||||
void sched_leaving_poll(int timeout, int interrupted);
|
|
||||||
void sched_entering_poll();
|
|
||||||
|
|
||||||
unsigned int run_tasks_from_lists(unsigned int budgets[]);
|
unsigned int run_tasks_from_lists(unsigned int budgets[]);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
92
src/clock.c
92
src/clock.c
@ -14,6 +14,7 @@
|
|||||||
#include <time.h>
|
#include <time.h>
|
||||||
|
|
||||||
#include <haproxy/api.h>
|
#include <haproxy/api.h>
|
||||||
|
#include <haproxy/activity.h>
|
||||||
#include <haproxy/clock.h>
|
#include <haproxy/clock.h>
|
||||||
#include <haproxy/time.h>
|
#include <haproxy/time.h>
|
||||||
#include <haproxy/tinfo-t.h>
|
#include <haproxy/tinfo-t.h>
|
||||||
@ -31,6 +32,8 @@ THREAD_LOCAL struct timeval date; /* the real current date (wall
|
|||||||
THREAD_LOCAL struct timeval before_poll; /* system date before calling poll() */
|
THREAD_LOCAL struct timeval before_poll; /* system date before calling poll() */
|
||||||
THREAD_LOCAL struct timeval after_poll; /* system date after leaving poll() */
|
THREAD_LOCAL struct timeval after_poll; /* system date after leaving poll() */
|
||||||
|
|
||||||
|
static THREAD_LOCAL unsigned int samp_time; /* total elapsed time over current sample */
|
||||||
|
static THREAD_LOCAL unsigned int idle_time; /* total idle time over current sample */
|
||||||
static THREAD_LOCAL unsigned int iso_time_sec; /* last iso time value for this thread */
|
static THREAD_LOCAL unsigned int iso_time_sec; /* last iso time value for this thread */
|
||||||
static THREAD_LOCAL char iso_time_str[34]; /* ISO time representation of gettimeofday() */
|
static THREAD_LOCAL char iso_time_str[34]; /* ISO time representation of gettimeofday() */
|
||||||
|
|
||||||
@ -212,6 +215,95 @@ void clock_init_thread_date(void)
|
|||||||
clock_update_date(0, 1);
|
clock_update_date(0, 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* report the average CPU idle percentage over all running threads, between 0 and 100 */
|
||||||
|
uint clock_report_idle(void)
|
||||||
|
{
|
||||||
|
uint total = 0;
|
||||||
|
uint rthr = 0;
|
||||||
|
uint thr;
|
||||||
|
|
||||||
|
for (thr = 0; thr < MAX_THREADS; thr++) {
|
||||||
|
if (!(all_threads_mask & (1UL << thr)))
|
||||||
|
continue;
|
||||||
|
total += HA_ATOMIC_LOAD(&ha_thread_info[thr].idle_pct);
|
||||||
|
rthr++;
|
||||||
|
}
|
||||||
|
return rthr ? total / rthr : 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Update the idle time value twice a second, to be called after
|
||||||
|
* clock_update_date() when called after poll(), and currently called only by
|
||||||
|
* clock_leaving_poll() below. It relies on <before_poll> to be updated to
|
||||||
|
* the system time before calling poll().
|
||||||
|
*/
|
||||||
|
static inline void clock_measure_idle(void)
|
||||||
|
{
|
||||||
|
/* Let's compute the idle to work ratio. We worked between after_poll
|
||||||
|
* and before_poll, and slept between before_poll and date. The idle_pct
|
||||||
|
* is updated at most twice every second. Note that the current second
|
||||||
|
* rarely changes so we avoid a multiply when not needed.
|
||||||
|
*/
|
||||||
|
int delta;
|
||||||
|
|
||||||
|
if ((delta = date.tv_sec - before_poll.tv_sec))
|
||||||
|
delta *= 1000000;
|
||||||
|
idle_time += delta + (date.tv_usec - before_poll.tv_usec);
|
||||||
|
|
||||||
|
if ((delta = date.tv_sec - after_poll.tv_sec))
|
||||||
|
delta *= 1000000;
|
||||||
|
samp_time += delta + (date.tv_usec - after_poll.tv_usec);
|
||||||
|
|
||||||
|
after_poll.tv_sec = date.tv_sec; after_poll.tv_usec = date.tv_usec;
|
||||||
|
if (samp_time < 500000)
|
||||||
|
return;
|
||||||
|
|
||||||
|
HA_ATOMIC_STORE(&ti->idle_pct, (100ULL * idle_time + samp_time / 2) / samp_time);
|
||||||
|
idle_time = samp_time = 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Collect date and time information after leaving poll(). <timeout> must be
|
||||||
|
* set to the maximum sleep time passed to poll (in milliseconds), and
|
||||||
|
* <interrupted> must be zero if the poller reached the timeout or non-zero
|
||||||
|
* otherwise, which generally is provided by the poller's return value.
|
||||||
|
*/
|
||||||
|
void clock_leaving_poll(int timeout, int interrupted)
|
||||||
|
{
|
||||||
|
clock_measure_idle();
|
||||||
|
ti->prev_cpu_time = now_cpu_time();
|
||||||
|
ti->prev_mono_time = now_mono_time();
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Collect date and time information before calling poll(). This will be used
|
||||||
|
* to count the run time of the past loop and the sleep time of the next poll.
|
||||||
|
* It also compares the elasped and cpu times during the activity period to
|
||||||
|
* estimate the amount of stolen time, which is reported if higher than half
|
||||||
|
* a millisecond.
|
||||||
|
*/
|
||||||
|
void clock_entering_poll(void)
|
||||||
|
{
|
||||||
|
uint64_t new_mono_time;
|
||||||
|
uint64_t new_cpu_time;
|
||||||
|
int64_t stolen;
|
||||||
|
|
||||||
|
gettimeofday(&before_poll, NULL);
|
||||||
|
|
||||||
|
new_cpu_time = now_cpu_time();
|
||||||
|
new_mono_time = now_mono_time();
|
||||||
|
|
||||||
|
if (ti->prev_cpu_time && ti->prev_mono_time) {
|
||||||
|
new_cpu_time -= ti->prev_cpu_time;
|
||||||
|
new_mono_time -= ti->prev_mono_time;
|
||||||
|
stolen = new_mono_time - new_cpu_time;
|
||||||
|
if (unlikely(stolen >= 500000)) {
|
||||||
|
stolen /= 500000;
|
||||||
|
/* more than half a millisecond difference might
|
||||||
|
* indicate an undesired preemption.
|
||||||
|
*/
|
||||||
|
report_stolen_time(stolen);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/* returns the current date as returned by gettimeofday() in ISO+microsecond
|
/* returns the current date as returned by gettimeofday() in ISO+microsecond
|
||||||
* format. It uses a thread-local static variable that the reader can consume
|
* format. It uses a thread-local static variable that the reader can consume
|
||||||
* for as long as it wants until next call. Thus, do not call it from a signal
|
* for as long as it wants until next call. Thus, do not call it from a signal
|
||||||
|
@ -189,7 +189,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
|
|
||||||
/* now let's wait for polled events */
|
/* now let's wait for polled events */
|
||||||
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
||||||
sched_entering_poll();
|
clock_entering_poll();
|
||||||
activity_count_runtime();
|
activity_count_runtime();
|
||||||
do {
|
do {
|
||||||
int timeout = (global.tune.options & GTUNE_BUSY_POLLING) ? 0 : wait_time;
|
int timeout = (global.tune.options & GTUNE_BUSY_POLLING) ? 0 : wait_time;
|
||||||
@ -209,7 +209,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
break;
|
break;
|
||||||
} while (1);
|
} while (1);
|
||||||
|
|
||||||
sched_leaving_poll(wait_time, status);
|
clock_leaving_poll(wait_time, status);
|
||||||
|
|
||||||
thread_harmless_end();
|
thread_harmless_end();
|
||||||
thread_idle_end();
|
thread_idle_end();
|
||||||
|
@ -159,7 +159,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
* Determine how long to wait for events to materialise on the port.
|
* Determine how long to wait for events to materialise on the port.
|
||||||
*/
|
*/
|
||||||
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
||||||
sched_entering_poll();
|
clock_entering_poll();
|
||||||
activity_count_runtime();
|
activity_count_runtime();
|
||||||
|
|
||||||
do {
|
do {
|
||||||
@ -203,7 +203,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
break;
|
break;
|
||||||
} while(1);
|
} while(1);
|
||||||
|
|
||||||
sched_leaving_poll(wait_time, nevlist);
|
clock_leaving_poll(wait_time, nevlist);
|
||||||
|
|
||||||
thread_harmless_end();
|
thread_harmless_end();
|
||||||
thread_idle_end();
|
thread_idle_end();
|
||||||
|
@ -146,7 +146,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
/* now let's wait for events */
|
/* now let's wait for events */
|
||||||
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
||||||
fd = global.tune.maxpollevents;
|
fd = global.tune.maxpollevents;
|
||||||
sched_entering_poll();
|
clock_entering_poll();
|
||||||
activity_count_runtime();
|
activity_count_runtime();
|
||||||
|
|
||||||
do {
|
do {
|
||||||
@ -175,7 +175,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
break;
|
break;
|
||||||
} while (1);
|
} while (1);
|
||||||
|
|
||||||
sched_leaving_poll(wait_time, status);
|
clock_leaving_poll(wait_time, status);
|
||||||
|
|
||||||
thread_harmless_end();
|
thread_harmless_end();
|
||||||
thread_idle_end();
|
thread_idle_end();
|
||||||
|
@ -202,11 +202,11 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
|
|
||||||
/* now let's wait for events */
|
/* now let's wait for events */
|
||||||
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
wait_time = wake ? 0 : compute_poll_timeout(exp);
|
||||||
sched_entering_poll();
|
clock_entering_poll();
|
||||||
activity_count_runtime();
|
activity_count_runtime();
|
||||||
status = poll(poll_events, nbfd, wait_time);
|
status = poll(poll_events, nbfd, wait_time);
|
||||||
clock_update_date(wait_time, status);
|
clock_update_date(wait_time, status);
|
||||||
sched_leaving_poll(wait_time, status);
|
clock_leaving_poll(wait_time, status);
|
||||||
|
|
||||||
thread_harmless_end();
|
thread_harmless_end();
|
||||||
thread_idle_end();
|
thread_idle_end();
|
||||||
|
@ -173,7 +173,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
delta_ms = wake ? 0 : compute_poll_timeout(exp);
|
delta_ms = wake ? 0 : compute_poll_timeout(exp);
|
||||||
delta.tv_sec = (delta_ms / 1000);
|
delta.tv_sec = (delta_ms / 1000);
|
||||||
delta.tv_usec = (delta_ms % 1000) * 1000;
|
delta.tv_usec = (delta_ms % 1000) * 1000;
|
||||||
sched_entering_poll();
|
clock_entering_poll();
|
||||||
activity_count_runtime();
|
activity_count_runtime();
|
||||||
status = select(maxfd,
|
status = select(maxfd,
|
||||||
readnotnull ? tmp_evts[DIR_RD] : NULL,
|
readnotnull ? tmp_evts[DIR_RD] : NULL,
|
||||||
@ -181,7 +181,7 @@ static void _do_poll(struct poller *p, int exp, int wake)
|
|||||||
NULL,
|
NULL,
|
||||||
&delta);
|
&delta);
|
||||||
clock_update_date(delta_ms, status);
|
clock_update_date(delta_ms, status);
|
||||||
sched_leaving_poll(delta_ms, status);
|
clock_leaving_poll(delta_ms, status);
|
||||||
|
|
||||||
thread_harmless_end();
|
thread_harmless_end();
|
||||||
thread_idle_end();
|
thread_idle_end();
|
||||||
|
@ -3448,7 +3448,7 @@ static void stats_dump_html_info(struct stream_interface *si, struct uri_auth *u
|
|||||||
actconn, pipes_used, pipes_used+pipes_free, read_freq_ctr(&global.conn_per_sec),
|
actconn, pipes_used, pipes_used+pipes_free, read_freq_ctr(&global.conn_per_sec),
|
||||||
bps >= 1000000000UL ? (bps / 1000000000.0) : bps >= 1000000UL ? (bps / 1000000.0) : (bps / 1000.0),
|
bps >= 1000000000UL ? (bps / 1000000000.0) : bps >= 1000000UL ? (bps / 1000000.0) : (bps / 1000.0),
|
||||||
bps >= 1000000000UL ? 'G' : bps >= 1000000UL ? 'M' : 'k',
|
bps >= 1000000000UL ? 'G' : bps >= 1000000UL ? 'M' : 'k',
|
||||||
total_run_queues(), total_allocated_tasks(), sched_report_idle()
|
total_run_queues(), total_allocated_tasks(), clock_report_idle()
|
||||||
);
|
);
|
||||||
|
|
||||||
/* scope_txt = search query, appctx->ctx.stats.scope_len is always <= STAT_SCOPE_TXT_MAXLEN */
|
/* scope_txt = search query, appctx->ctx.stats.scope_len is always <= STAT_SCOPE_TXT_MAXLEN */
|
||||||
@ -4481,7 +4481,7 @@ int stats_fill_info(struct field *info, int len, uint flags)
|
|||||||
#endif
|
#endif
|
||||||
info[INF_TASKS] = mkf_u32(0, total_allocated_tasks());
|
info[INF_TASKS] = mkf_u32(0, total_allocated_tasks());
|
||||||
info[INF_RUN_QUEUE] = mkf_u32(0, total_run_queues());
|
info[INF_RUN_QUEUE] = mkf_u32(0, total_run_queues());
|
||||||
info[INF_IDLE_PCT] = mkf_u32(FN_AVG, sched_report_idle());
|
info[INF_IDLE_PCT] = mkf_u32(FN_AVG, clock_report_idle());
|
||||||
info[INF_NODE] = mkf_str(FO_CONFIG|FN_OUTPUT|FS_SERVICE, global.node);
|
info[INF_NODE] = mkf_str(FO_CONFIG|FN_OUTPUT|FS_SERVICE, global.node);
|
||||||
if (global.desc)
|
if (global.desc)
|
||||||
info[INF_DESCRIPTION] = mkf_str(FO_CONFIG|FN_OUTPUT|FS_SERVICE, global.desc);
|
info[INF_DESCRIPTION] = mkf_str(FO_CONFIG|FN_OUTPUT|FS_SERVICE, global.desc);
|
||||||
|
93
src/task.c
93
src/task.c
@ -38,10 +38,6 @@ DECLARE_POOL(pool_head_notification, "notification", sizeof(struct notification)
|
|||||||
volatile unsigned long global_tasks_mask = 0; /* Mask of threads with tasks in the global runqueue */
|
volatile unsigned long global_tasks_mask = 0; /* Mask of threads with tasks in the global runqueue */
|
||||||
unsigned int niced_tasks = 0; /* number of niced tasks in the run queue */
|
unsigned int niced_tasks = 0; /* number of niced tasks in the run queue */
|
||||||
|
|
||||||
/* used for idle time calculation */
|
|
||||||
THREAD_LOCAL unsigned int samp_time = 0; /* total elapsed time over current sample */
|
|
||||||
THREAD_LOCAL unsigned int idle_time = 0; /* total idle time over current sample */
|
|
||||||
|
|
||||||
THREAD_LOCAL struct task_per_thread *sched = &task_per_thread[0]; /* scheduler context for the current thread */
|
THREAD_LOCAL struct task_per_thread *sched = &task_per_thread[0]; /* scheduler context for the current thread */
|
||||||
|
|
||||||
__decl_aligned_spinlock(rq_lock); /* spin lock related to run queue */
|
__decl_aligned_spinlock(rq_lock); /* spin lock related to run queue */
|
||||||
@ -865,95 +861,6 @@ void process_runnable_tasks()
|
|||||||
activity[tid].long_rq++;
|
activity[tid].long_rq++;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* report the average CPU idle percentage over all running threads, between 0 and 100 */
|
|
||||||
uint sched_report_idle()
|
|
||||||
{
|
|
||||||
uint total = 0;
|
|
||||||
uint rthr = 0;
|
|
||||||
uint thr;
|
|
||||||
|
|
||||||
for (thr = 0; thr < MAX_THREADS; thr++) {
|
|
||||||
if (!(all_threads_mask & (1UL << thr)))
|
|
||||||
continue;
|
|
||||||
total += HA_ATOMIC_LOAD(&ha_thread_info[thr].idle_pct);
|
|
||||||
rthr++;
|
|
||||||
}
|
|
||||||
return rthr ? total / rthr : 0;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Update the idle time value twice a second, to be called after
|
|
||||||
* clock_update_date() when called after poll(), and currently called only by
|
|
||||||
* sched_leaving_poll() below. It relies on <before_poll> to be updated to
|
|
||||||
* the system time before calling poll().
|
|
||||||
*/
|
|
||||||
static inline void sched_measure_idle()
|
|
||||||
{
|
|
||||||
/* Let's compute the idle to work ratio. We worked between after_poll
|
|
||||||
* and before_poll, and slept between before_poll and date. The idle_pct
|
|
||||||
* is updated at most twice every second. Note that the current second
|
|
||||||
* rarely changes so we avoid a multiply when not needed.
|
|
||||||
*/
|
|
||||||
int delta;
|
|
||||||
|
|
||||||
if ((delta = date.tv_sec - before_poll.tv_sec))
|
|
||||||
delta *= 1000000;
|
|
||||||
idle_time += delta + (date.tv_usec - before_poll.tv_usec);
|
|
||||||
|
|
||||||
if ((delta = date.tv_sec - after_poll.tv_sec))
|
|
||||||
delta *= 1000000;
|
|
||||||
samp_time += delta + (date.tv_usec - after_poll.tv_usec);
|
|
||||||
|
|
||||||
after_poll.tv_sec = date.tv_sec; after_poll.tv_usec = date.tv_usec;
|
|
||||||
if (samp_time < 500000)
|
|
||||||
return;
|
|
||||||
|
|
||||||
HA_ATOMIC_STORE(&ti->idle_pct, (100ULL * idle_time + samp_time / 2) / samp_time);
|
|
||||||
idle_time = samp_time = 0;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Collect date and time information after leaving poll(). <timeout> must be
|
|
||||||
* set to the maximum sleep time passed to poll (in milliseconds), and
|
|
||||||
* <interrupted> must be zero if the poller reached the timeout or non-zero
|
|
||||||
* otherwise, which generally is provided by the poller's return value.
|
|
||||||
*/
|
|
||||||
void sched_leaving_poll(int timeout, int interrupted)
|
|
||||||
{
|
|
||||||
sched_measure_idle();
|
|
||||||
ti->prev_cpu_time = now_cpu_time();
|
|
||||||
ti->prev_mono_time = now_mono_time();
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Collect date and time information before calling poll(). This will be used
|
|
||||||
* to count the run time of the past loop and the sleep time of the next poll.
|
|
||||||
* It also compares the elasped and cpu times during the activity period to
|
|
||||||
* estimate the amount of stolen time, which is reported if higher than half
|
|
||||||
* a millisecond.
|
|
||||||
*/
|
|
||||||
void sched_entering_poll()
|
|
||||||
{
|
|
||||||
uint64_t new_mono_time;
|
|
||||||
uint64_t new_cpu_time;
|
|
||||||
int64_t stolen;
|
|
||||||
|
|
||||||
gettimeofday(&before_poll, NULL);
|
|
||||||
|
|
||||||
new_cpu_time = now_cpu_time();
|
|
||||||
new_mono_time = now_mono_time();
|
|
||||||
|
|
||||||
if (ti->prev_cpu_time && ti->prev_mono_time) {
|
|
||||||
new_cpu_time -= ti->prev_cpu_time;
|
|
||||||
new_mono_time -= ti->prev_mono_time;
|
|
||||||
stolen = new_mono_time - new_cpu_time;
|
|
||||||
if (unlikely(stolen >= 500000)) {
|
|
||||||
stolen /= 500000;
|
|
||||||
/* more than half a millisecond difference might
|
|
||||||
* indicate an undesired preemption.
|
|
||||||
*/
|
|
||||||
report_stolen_time(stolen);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Delete every tasks before running the master polling loop
|
* Delete every tasks before running the master polling loop
|
||||||
*/
|
*/
|
||||||
|
Loading…
Reference in New Issue
Block a user