feat(rules): add NodeFileDescriptorLimit kernel exhaustion alert

Add a new alert when fs.file-nr is close to fs.file-max

Signed-off-by: Loic Blot <loic.blot@unix-experience.fr>
This commit is contained in:
Loïc Blot 2021-04-30 12:01:51 +02:00 committed by Loic Blot
parent 504f9b785c
commit 55ffe57cbc
No known key found for this signature in database
GPG Key ID: EFAA458E8C153987
1 changed files with 32 additions and 0 deletions

View File

@ -277,6 +277,38 @@
description: "At least one device in RAID array on {{ $labels.instance }} failed. Array '{{ $labels.device }}' needs attention and possibly a disk swap.", description: "At least one device in RAID array on {{ $labels.instance }} failed. Array '{{ $labels.device }}' needs attention and possibly a disk swap.",
}, },
}, },
{
  // Warning-level alert: fires when the allocated file descriptors stay above
  // 70% of the maximum for 15 minutes.
  // This is a static threshold on the current ratio, not a forecast.
  alert: 'NodeFileDescriptorLimit',
  // The series selector is taken from $._config so that deployments which
  // override the node-exporter job selector are still matched.
  // NOTE(review): assumes $._config defines `nodeExporterSelector` — confirm.
  expr: |||
    (
      node_filefd_allocated{%(nodeExporterSelector)s} * 100 / node_filefd_maximum{%(nodeExporterSelector)s} > 70
    )
  ||| % $._config,
  'for': '15m',
  labels: {
    severity: 'warning',
  },
  annotations: {
    summary: 'Kernel is predicted to exhaust file descriptors limit soon.',
    // Plain string (no Jsonnet `%` formatting applied), so the Go-template
    // `%.2f` and the trailing `%` must stay unescaped here.
    description: 'File descriptors limit at {{ $labels.instance }} is currently at {{ printf "%.2f" $value }}%.',
  },
},
{
  // Critical-level alert: fires when the allocated file descriptors stay above
  // 90% of the maximum for 15 minutes.
  // This is a static threshold on the current ratio, not a forecast.
  alert: 'NodeFileDescriptorLimit',
  // The series selector is taken from $._config so that deployments which
  // override the node-exporter job selector are still matched.
  // NOTE(review): assumes $._config defines `nodeExporterSelector` — confirm.
  expr: |||
    (
      node_filefd_allocated{%(nodeExporterSelector)s} * 100 / node_filefd_maximum{%(nodeExporterSelector)s} > 90
    )
  ||| % $._config,
  'for': '15m',
  labels: {
    severity: 'critical',
  },
  annotations: {
    summary: 'Kernel is predicted to exhaust file descriptors limit soon.',
    // Plain string (no Jsonnet `%` formatting applied), so the Go-template
    // `%.2f` and the trailing `%` must stay unescaped here.
    description: 'File descriptors limit at {{ $labels.instance }} is currently at {{ printf "%.2f" $value }}%.',
  },
},
], ],
}, },
], ],