Merge pull request #2030 from nerzhul/patch-1

feat(rules): add NodeFileDescriptorLimit kernel exhaustion alert
This commit is contained in:
Ben Kochie 2021-07-14 13:16:58 +02:00 committed by GitHub
commit 7029c71bcf
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@ -277,6 +277,38 @@
description: "At least one device in RAID array on {{ $labels.instance }} failed. Array '{{ $labels.device }}' needs attention and possibly a disk swap.",
},
},
{
  // Warning-level alert: fires when allocated file descriptors, expressed as
  // a percentage of node_filefd_maximum, stay above 70 for 15 minutes.
  alert: 'NodeFileDescriptorLimit',
  // The selector comes from $._config rather than a hard-coded job label, so
  // that the `% $._config` formatting below actually takes effect and the
  // rule follows whatever selector the mixin user configured.
  // NOTE(review): assumes $._config defines `nodeExporterSelector` — confirm
  // against the mixin's config file.
  expr: |||
    (
      node_filefd_allocated{%(nodeExporterSelector)s} * 100 / node_filefd_maximum{%(nodeExporterSelector)s} > 70
    )
  ||| % $._config,
  'for': '15m',
  labels: {
    severity: 'warning',
  },
  annotations: {
    summary: 'Kernel is predicted to exhaust file descriptors limit soon.',
    // $value is the percentage computed by the expression above.
    description: 'File descriptors limit at {{ $labels.instance }} is currently at {{ printf "%.2f" $value }}%.',
  },
},
{
  // Critical-level alert: fires when allocated file descriptors, expressed as
  // a percentage of node_filefd_maximum, stay above 90 for 15 minutes.
  alert: 'NodeFileDescriptorLimit',
  // The selector comes from $._config rather than a hard-coded job label, so
  // that the `% $._config` formatting below actually takes effect and the
  // rule follows whatever selector the mixin user configured.
  // NOTE(review): assumes $._config defines `nodeExporterSelector` — confirm
  // against the mixin's config file.
  expr: |||
    (
      node_filefd_allocated{%(nodeExporterSelector)s} * 100 / node_filefd_maximum{%(nodeExporterSelector)s} > 90
    )
  ||| % $._config,
  'for': '15m',
  labels: {
    severity: 'critical',
  },
  annotations: {
    summary: 'Kernel is predicted to exhaust file descriptors limit soon.',
    // $value is the percentage computed by the expression above.
    description: 'File descriptors limit at {{ $labels.instance }} is currently at {{ printf "%.2f" $value }}%.',
  },
},
],
},
],