alertmanager/types/types.go

473 lines
13 KiB
Go
Raw Normal View History

2015-10-11 15:24:49 +00:00
// Copyright 2015 Prometheus Team
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
2015-09-25 12:38:22 +00:00
package types
2015-09-25 16:14:46 +00:00
import (
2015-10-11 10:40:43 +00:00
"strings"
"sync"
2015-09-25 16:14:46 +00:00
"time"
"github.com/prometheus/client_golang/prometheus"
2015-09-25 16:14:46 +00:00
"github.com/prometheus/common/model"
)
// AlertState is used as part of AlertStatus.
2017-05-10 09:49:02 +00:00
type AlertState string
2017-04-27 12:18:52 +00:00
// Possible values for AlertState.
2017-04-27 12:18:52 +00:00
const (
2017-05-10 09:49:02 +00:00
AlertStateUnprocessed AlertState = "unprocessed"
AlertStateActive AlertState = "active"
AlertStateSuppressed AlertState = "suppressed"
2017-04-27 12:18:52 +00:00
)
// AlertStatus stores the state of an alert and, as applicable, the IDs of
// silences silencing the alert and of other alerts inhibiting the alert. Note
// that currently, SilencedBy is supposed to be the complete set of the relevant
// silences while InhibitedBy may contain only a subset of the inhibiting alerts
// in practice exactly one ID. (This somewhat confusing semantics might change
// in the future.)
2017-04-27 12:18:52 +00:00
type AlertStatus struct {
2017-05-10 09:49:02 +00:00
State AlertState `json:"state"`
SilencedBy []string `json:"silencedBy"`
InhibitedBy []string `json:"inhibitedBy"`
silencesVersion int
2017-04-27 12:18:52 +00:00
}
// Marker helps to mark alerts as silenced and/or inhibited.
// All methods are goroutine-safe.
type Marker interface {
// SetActive sets the provided alert to AlertStateActive and deletes all
// SilencedBy and InhibitedBy entries.
2017-04-27 12:18:52 +00:00
SetActive(alert model.Fingerprint)
// SetSilenced replaces the previous SilencedBy by the provided IDs of
// silences, including the version number of the silences state. The set
// of provided IDs is supposed to represent the complete set of relevant
// silences. If no ID is provided and InhibitedBy is already empty, this
// call is equivalent to SetActive. Otherwise, it sets
// AlertStateSuppressed.
SetSilenced(alert model.Fingerprint, version int, silenceIDs ...string)
// SetInhibited replaces the previous InhibitedBy by the provided IDs of
// alerts. In contrast to SetSilenced, the set of provided IDs is not
// expected to represent the complete set of inhibiting alerts. (In
// practice, this method is only called with one or zero IDs. However,
// this expectation might change in the future.) If no ID is provided and
// SilencedBy is already empty, this call is equivalent to
// SetActive. Otherwise, it sets AlertStateSuppressed.
SetInhibited(alert model.Fingerprint, alertIDs ...string)
// Count alerts of the given state(s). With no state provided, count all
// alerts.
Count(...AlertState) int
// Status of the given alert.
2017-04-27 12:18:52 +00:00
Status(model.Fingerprint) AlertStatus
// Delete the given alert.
2017-04-27 12:18:52 +00:00
Delete(model.Fingerprint)
// Various methods to inquire if the given alert is in a certain
// AlertState. Silenced also returns all the silencing silences, while
// Inhibited may return only a subset of inhibiting alerts. Silenced
// also returns the version of the silences state the result is based
// on.
2017-04-27 12:18:52 +00:00
Unprocessed(model.Fingerprint) bool
Active(model.Fingerprint) bool
Silenced(model.Fingerprint) ([]string, int, bool)
2017-04-27 12:18:52 +00:00
Inhibited(model.Fingerprint) ([]string, bool)
}
// NewMarker returns an instance of a Marker implementation.
func NewMarker(r prometheus.Registerer) Marker {
m := &memMarker{
2017-04-27 12:18:52 +00:00
m: map[model.Fingerprint]*AlertStatus{},
}
m.registerMetrics(r)
return m
}
type memMarker struct {
2017-04-27 12:18:52 +00:00
m map[model.Fingerprint]*AlertStatus
mtx sync.RWMutex
}
func (m *memMarker) registerMetrics(r prometheus.Registerer) {
newAlertMetricByState := func(st AlertState) prometheus.GaugeFunc {
return prometheus.NewGaugeFunc(
prometheus.GaugeOpts{
Name: "alertmanager_alerts",
Help: "How many alerts by state.",
ConstLabels: prometheus.Labels{"state": string(st)},
},
func() float64 {
return float64(m.Count(st))
},
)
}
alertsActive := newAlertMetricByState(AlertStateActive)
alertsSuppressed := newAlertMetricByState(AlertStateSuppressed)
r.MustRegister(alertsActive)
r.MustRegister(alertsSuppressed)
}
// Count implements Marker.
func (m *memMarker) Count(states ...AlertState) int {
count := 0
m.mtx.RLock()
defer m.mtx.RUnlock()
if len(states) == 0 {
count = len(m.m)
} else {
for _, status := range m.m {
for _, state := range states {
if status.State == state {
2017-11-01 22:08:34 +00:00
count++
}
}
}
}
return count
}
// SetSilenced implements Marker.
func (m *memMarker) SetSilenced(alert model.Fingerprint, version int, ids ...string) {
2017-05-10 09:49:02 +00:00
m.mtx.Lock()
2017-04-27 12:18:52 +00:00
s, found := m.m[alert]
if !found {
s = &AlertStatus{}
m.m[alert] = s
}
s.silencesVersion = version
2017-04-27 12:18:52 +00:00
// If there are any silence or alert IDs associated with the
// fingerprint, it is suppressed. Otherwise, set it to
// AlertStateUnprocessed.
if len(ids) == 0 && len(s.InhibitedBy) == 0 {
2017-05-10 09:49:02 +00:00
m.mtx.Unlock()
2017-04-27 12:18:52 +00:00
m.SetActive(alert)
return
}
2017-05-10 09:49:02 +00:00
s.State = AlertStateSuppressed
2017-04-27 12:18:52 +00:00
s.SilencedBy = ids
2017-05-10 09:49:02 +00:00
m.mtx.Unlock()
}
// SetInhibited implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) SetInhibited(alert model.Fingerprint, ids ...string) {
2017-05-10 09:49:02 +00:00
m.mtx.Lock()
2017-04-27 12:18:52 +00:00
s, found := m.m[alert]
if !found {
s = &AlertStatus{}
m.m[alert] = s
}
// If there are any silence or alert IDs associated with the
// fingerprint, it is suppressed. Otherwise, set it to
// AlertStateUnprocessed.
if len(ids) == 0 && len(s.SilencedBy) == 0 {
2017-05-10 09:49:02 +00:00
m.mtx.Unlock()
2017-04-27 12:18:52 +00:00
m.SetActive(alert)
return
}
2017-05-10 09:49:02 +00:00
s.State = AlertStateSuppressed
2017-04-27 12:18:52 +00:00
s.InhibitedBy = ids
2017-05-10 09:49:02 +00:00
m.mtx.Unlock()
2017-04-27 12:18:52 +00:00
}
2017-05-10 09:49:02 +00:00
// SetActive implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) SetActive(alert model.Fingerprint) {
2017-05-10 09:49:02 +00:00
m.mtx.Lock()
defer m.mtx.Unlock()
2017-04-27 12:18:52 +00:00
s, found := m.m[alert]
if !found {
2017-05-10 09:49:02 +00:00
s = &AlertStatus{
SilencedBy: []string{},
InhibitedBy: []string{},
}
2017-04-27 12:18:52 +00:00
m.m[alert] = s
}
2017-04-27 12:18:52 +00:00
2017-05-10 09:49:02 +00:00
s.State = AlertStateActive
2017-04-27 12:18:52 +00:00
s.SilencedBy = []string{}
s.InhibitedBy = []string{}
}
// Status implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) Status(alert model.Fingerprint) AlertStatus {
m.mtx.RLock()
defer m.mtx.RUnlock()
2017-04-27 12:18:52 +00:00
s, found := m.m[alert]
if !found {
2017-05-10 09:49:02 +00:00
s = &AlertStatus{
State: AlertStateUnprocessed,
SilencedBy: []string{},
InhibitedBy: []string{},
}
}
2017-04-27 12:18:52 +00:00
return *s
}
// Delete implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) Delete(alert model.Fingerprint) {
2017-05-10 09:49:02 +00:00
m.mtx.Lock()
defer m.mtx.Unlock()
2017-04-27 12:18:52 +00:00
delete(m.m, alert)
}
// Unprocessed implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) Unprocessed(alert model.Fingerprint) bool {
2017-05-10 09:49:02 +00:00
return m.Status(alert).State == AlertStateUnprocessed
2017-04-27 12:18:52 +00:00
}
// Active implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) Active(alert model.Fingerprint) bool {
2017-05-10 09:49:02 +00:00
return m.Status(alert).State == AlertStateActive
2017-04-27 12:18:52 +00:00
}
// Inhibited implements Marker.
2017-04-27 12:18:52 +00:00
func (m *memMarker) Inhibited(alert model.Fingerprint) ([]string, bool) {
s := m.Status(alert)
return s.InhibitedBy,
2017-05-10 09:49:02 +00:00
s.State == AlertStateSuppressed && len(s.InhibitedBy) > 0
2017-04-27 12:18:52 +00:00
}
// Silenced returns whether the alert for the given Fingerprint is in the
// Silenced state, any associated silence IDs, and the silences state version
// the result is based on.
func (m *memMarker) Silenced(alert model.Fingerprint) ([]string, int, bool) {
2017-04-27 12:18:52 +00:00
s := m.Status(alert)
return s.SilencedBy, s.silencesVersion,
2017-05-10 09:49:02 +00:00
s.State == AlertStateSuppressed && len(s.SilencedBy) > 0
}
// MultiError contains multiple errors and implements the error interface. Its
// zero value is ready to use. All its methods are goroutine safe.
type MultiError struct {
mtx sync.Mutex
errors []error
}
// Add adds an error to the MultiError.
func (e *MultiError) Add(err error) {
e.mtx.Lock()
defer e.mtx.Unlock()
e.errors = append(e.errors, err)
}
// Len returns the number of errors added to the MultiError.
func (e *MultiError) Len() int {
e.mtx.Lock()
defer e.mtx.Unlock()
return len(e.errors)
}
// Errors returns the errors added to the MuliError. The returned slice is a
// copy of the internal slice of errors.
func (e *MultiError) Errors() []error {
e.mtx.Lock()
defer e.mtx.Unlock()
return append(make([]error, 0, len(e.errors)), e.errors...)
}
func (e *MultiError) Error() string {
e.mtx.Lock()
defer e.mtx.Unlock()
2015-10-11 10:40:43 +00:00
es := make([]string, 0, len(e.errors))
for _, err := range e.errors {
2015-10-11 10:40:43 +00:00
es = append(es, err.Error())
}
return strings.Join(es, "; ")
}
2015-10-01 12:53:49 +00:00
// Alert wraps a model.Alert with additional information relevant
// to internal of the Alertmanager.
// The type is never exposed to external communication and the
// embedded alert has to be sanitized beforehand.
2015-09-25 12:38:22 +00:00
type Alert struct {
2015-10-01 12:53:49 +00:00
model.Alert
2015-09-25 12:38:22 +00:00
// The authoritative timestamp.
UpdatedAt time.Time
Timeout bool
}
// AlertSlice is a sortable slice of Alerts.
2015-10-27 17:24:09 +00:00
type AlertSlice []*Alert
func (as AlertSlice) Less(i, j int) bool {
// Look at labels.job, then labels.instance.
for _, overrideKey := range [...]model.LabelName{"job", "instance"} {
iVal, iOk := as[i].Labels[overrideKey]
jVal, jOk := as[j].Labels[overrideKey]
if !iOk && !jOk {
continue
}
if !iOk {
return false
}
if !jOk {
return true
}
if iVal != jVal {
return iVal < jVal
}
}
return as[i].Labels.Before(as[j].Labels)
}
func (as AlertSlice) Swap(i, j int) { as[i], as[j] = as[j], as[i] }
func (as AlertSlice) Len() int { return len(as) }
2015-10-27 17:24:09 +00:00
// Alerts turns a sequence of internal alerts into a list of
// exposable model.Alert structures.
func Alerts(alerts ...*Alert) model.Alerts {
res := make(model.Alerts, 0, len(alerts))
for _, a := range alerts {
v := a.Alert
// If the end timestamp is not reached yet, do not expose it.
if !a.Resolved() {
v.EndsAt = time.Time{}
}
res = append(res, &v)
}
return res
2015-09-25 12:38:22 +00:00
}
// Merge merges the timespan of two alerts based and overwrites annotations
// based on the authoritative timestamp. A new alert is returned, the labels
// are assumed to be equal.
2015-10-02 14:52:04 +00:00
func (a *Alert) Merge(o *Alert) *Alert {
// Let o always be the younger alert.
if o.UpdatedAt.Before(a.UpdatedAt) {
2015-10-02 14:52:04 +00:00
return o.Merge(a)
}
res := *o
// Always pick the earliest starting time.
if a.StartsAt.Before(o.StartsAt) {
res.StartsAt = a.StartsAt
}
if o.Resolved() {
// The latest explicit resolved timestamp wins if both alerts are effectively resolved.
if a.Resolved() && a.EndsAt.After(o.EndsAt) {
res.EndsAt = a.EndsAt
}
} else {
// A non-timeout timestamp always rules if it is the latest.
if a.EndsAt.After(o.EndsAt) && !a.Timeout {
res.EndsAt = a.EndsAt
}
2015-10-02 14:52:04 +00:00
}
return &res
}
2015-09-25 12:38:22 +00:00
// A Muter determines whether a given label set is muted. Implementers that
// maintain an underlying Marker are expected to update it during a call of
// Mutes.
2015-09-28 12:13:01 +00:00
type Muter interface {
2015-09-25 16:14:46 +00:00
Mutes(model.LabelSet) bool
}
// A MuteFunc is a function that implements the Muter interface.
2015-09-28 12:13:01 +00:00
type MuteFunc func(model.LabelSet) bool
// Mutes implements the Muter interface.
2015-09-28 12:13:01 +00:00
func (f MuteFunc) Mutes(lset model.LabelSet) bool { return f(lset) }
// A Silence determines whether a given label set is muted.
2015-09-25 16:14:46 +00:00
type Silence struct {
// A unique identifier across all connected instances.
2016-08-30 09:58:27 +00:00
ID string `json:"id"`
// A set of matchers determining if a label set is affect
2015-09-27 12:07:04 +00:00
// by the silence.
Matchers Matchers `json:"matchers"`
// Time range of the silence.
//
// * StartsAt must not be before creation time
// * EndsAt must be after StartsAt
// * Deleting a silence means to set EndsAt to now
// * Time range must not be modified in different ways
//
// TODO(fabxc): this may potentially be extended by
// creation and update timestamps.
StartsAt time.Time `json:"startsAt"`
EndsAt time.Time `json:"endsAt"`
2016-05-30 17:08:57 +00:00
// The last time the silence was updated.
UpdatedAt time.Time `json:"updatedAt"`
// Information about who created the silence for which reason.
CreatedBy string `json:"createdBy"`
Comment string `json:"comment,omitempty"`
2015-09-25 16:14:46 +00:00
Status SilenceStatus `json:"status"`
}
// Expired return if the silence is expired
// meaning that both StartsAt and EndsAt are equal
func (s *Silence) Expired() bool {
return s.StartsAt.Equal(s.EndsAt)
}
// SilenceStatus stores the state of a silence.
type SilenceStatus struct {
State SilenceState `json:"state"`
}
// SilenceState is used as part of SilenceStatus.
type SilenceState string
// Possible values for SilenceState.
const (
SilenceStateExpired SilenceState = "expired"
SilenceStateActive SilenceState = "active"
SilenceStatePending SilenceState = "pending"
)
// CalcSilenceState returns the SilenceState that a silence with the given start
// and end time would have right now.
func CalcSilenceState(start, end time.Time) SilenceState {
current := time.Now()
if current.Before(start) {
return SilenceStatePending
}
if current.Before(end) {
return SilenceStateActive
}
return SilenceStateExpired
2015-09-25 16:14:46 +00:00
}