mirror of
https://github.com/prometheus/node_exporter
synced 2025-01-25 14:42:58 +00:00
Merge pull request #1711 from prometheus/superq/cpu_cache
Linux CPU: Cache CPU metrics
This commit is contained in:
commit
7e7845a29f
@ -28,7 +28,7 @@ jobs:
|
|||||||
steps:
|
steps:
|
||||||
- checkout
|
- checkout
|
||||||
- run: sudo pip install codespell
|
- run: sudo pip install codespell
|
||||||
- run: codespell --skip=".git,./vendor,ttar,go.mod,go.sum,*pem" -L uint,packages\',uptodate
|
- run: codespell --skip=".git,./vendor,ttar,go.mod,go.sum,*pem,./collector/fixtures" -L uint,packages\',uptodate
|
||||||
|
|
||||||
build:
|
build:
|
||||||
machine:
|
machine:
|
||||||
|
@ -3,7 +3,7 @@
|
|||||||
* [CHANGE]
|
* [CHANGE]
|
||||||
* [FEATURE]
|
* [FEATURE]
|
||||||
* [ENHANCEMENT]
|
* [ENHANCEMENT]
|
||||||
* [BUGFIX]
|
* [BUGFIX] Linux CPU: Cache CPU metrics to make them monotonically increasing #1711
|
||||||
|
|
||||||
## 1.0.0-rc.1 / 2020-05-14
|
## 1.0.0-rc.1 / 2020-05-14
|
||||||
|
|
||||||
|
@ -19,6 +19,7 @@ import (
|
|||||||
"fmt"
|
"fmt"
|
||||||
"path/filepath"
|
"path/filepath"
|
||||||
"strconv"
|
"strconv"
|
||||||
|
"sync"
|
||||||
|
|
||||||
"github.com/go-kit/kit/log"
|
"github.com/go-kit/kit/log"
|
||||||
"github.com/go-kit/kit/log/level"
|
"github.com/go-kit/kit/log/level"
|
||||||
@ -35,6 +36,8 @@ type cpuCollector struct {
|
|||||||
cpuCoreThrottle *prometheus.Desc
|
cpuCoreThrottle *prometheus.Desc
|
||||||
cpuPackageThrottle *prometheus.Desc
|
cpuPackageThrottle *prometheus.Desc
|
||||||
logger log.Logger
|
logger log.Logger
|
||||||
|
cpuStats []procfs.CPUStat
|
||||||
|
cpuStatsMutex sync.Mutex
|
||||||
}
|
}
|
||||||
|
|
||||||
var (
|
var (
|
||||||
@ -203,7 +206,12 @@ func (c *cpuCollector) updateStat(ch chan<- prometheus.Metric) error {
|
|||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
for cpuID, cpuStat := range stats.CPU {
|
c.updateCPUStats(stats.CPU)
|
||||||
|
|
||||||
|
// Acquire a lock to read the stats.
|
||||||
|
c.cpuStatsMutex.Lock()
|
||||||
|
defer c.cpuStatsMutex.Unlock()
|
||||||
|
for cpuID, cpuStat := range c.cpuStats {
|
||||||
cpuNum := strconv.Itoa(cpuID)
|
cpuNum := strconv.Itoa(cpuID)
|
||||||
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.User, cpuNum, "user")
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.User, cpuNum, "user")
|
||||||
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Nice, cpuNum, "nice")
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Nice, cpuNum, "nice")
|
||||||
@ -221,3 +229,78 @@ func (c *cpuCollector) updateStat(ch chan<- prometheus.Metric) error {
|
|||||||
|
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// updateCPUStats updates the internal cache of CPU stats.
|
||||||
|
func (c *cpuCollector) updateCPUStats(newStats []procfs.CPUStat) {
|
||||||
|
// Acquire a lock to update the stats.
|
||||||
|
c.cpuStatsMutex.Lock()
|
||||||
|
defer c.cpuStatsMutex.Unlock()
|
||||||
|
|
||||||
|
// Reset the cache if the list of CPUs has changed.
|
||||||
|
if len(c.cpuStats) != len(newStats) {
|
||||||
|
c.cpuStats = make([]procfs.CPUStat, len(newStats))
|
||||||
|
}
|
||||||
|
|
||||||
|
for i, n := range newStats {
|
||||||
|
// If idle jumps backwards, assume we had a hotplug event and reset the stats for this CPU.
|
||||||
|
if n.Idle < c.cpuStats[i].Idle {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU Idle counter jumped backwards, possible hotplug event, resetting CPU stats", "cpu", i, "old_value", c.cpuStats[i].Idle, "new_value", n.Idle)
|
||||||
|
c.cpuStats[i] = procfs.CPUStat{}
|
||||||
|
}
|
||||||
|
c.cpuStats[i].Idle = n.Idle
|
||||||
|
|
||||||
|
if n.User >= c.cpuStats[i].User {
|
||||||
|
c.cpuStats[i].User = n.User
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU User counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].User, "new_value", n.User)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.Nice >= c.cpuStats[i].Nice {
|
||||||
|
c.cpuStats[i].Nice = n.Nice
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU Nice counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].Nice, "new_value", n.Nice)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.System >= c.cpuStats[i].System {
|
||||||
|
c.cpuStats[i].System = n.System
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU System counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].System, "new_value", n.System)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.Iowait >= c.cpuStats[i].Iowait {
|
||||||
|
c.cpuStats[i].Iowait = n.Iowait
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU Iowait counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].Iowait, "new_value", n.Iowait)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.IRQ >= c.cpuStats[i].IRQ {
|
||||||
|
c.cpuStats[i].IRQ = n.IRQ
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU IRQ counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].IRQ, "new_value", n.IRQ)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.SoftIRQ >= c.cpuStats[i].SoftIRQ {
|
||||||
|
c.cpuStats[i].SoftIRQ = n.SoftIRQ
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU SoftIRQ counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].SoftIRQ, "new_value", n.SoftIRQ)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.Steal >= c.cpuStats[i].Steal {
|
||||||
|
c.cpuStats[i].Steal = n.Steal
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU Steal counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].Steal, "new_value", n.Steal)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.Guest >= c.cpuStats[i].Guest {
|
||||||
|
c.cpuStats[i].Guest = n.Guest
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU Guest counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].Guest, "new_value", n.Guest)
|
||||||
|
}
|
||||||
|
|
||||||
|
if n.GuestNice >= c.cpuStats[i].GuestNice {
|
||||||
|
c.cpuStats[i].GuestNice = n.GuestNice
|
||||||
|
} else {
|
||||||
|
level.Warn(c.logger).Log("msg", "CPU GuestNice counter jumped backwards", "cpu", i, "old_value", c.cpuStats[i].GuestNice, "new_value", n.GuestNice)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user