Skip to content

Commit 4a0ebdf

Browse files
paulfantom authored and oblitorum committed
docs/node-mixin: add alerts about failing RAID array
Signed-off-by: paulfantom <pawel@krupa.net.pl>
1 parent 6ad5c54 commit 4a0ebdf

File tree

1 file changed

+27
-0
lines changed

1 file changed

+27
-0
lines changed

docs/node-mixin/alerts/alerts.libsonnet

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -248,6 +248,33 @@
248248
message: 'Clock on {{ $labels.instance }} is not synchronising. Ensure NTP is configured on this host.',
249249
},
250250
},
251+
{
  // Critical alert: the array has had fewer active member disks than it
  // requires for 15 minutes.
  alert: 'NodeRAIDDegraded',
  // The expression must be raw PromQL inside the text block. Wrapping it in
  // quotes turns it into a string literal instead of a vector comparison.
  // `ignoring (state)` lets the two series match, because only
  // node_md_disks carries the `state` label.
  expr: |||
    node_md_disks_required - ignoring (state) (node_md_disks{state="active"}) > 0
  ||| % $._config,
  'for': '15m',
  labels: {
    severity: 'critical',
  },
  annotations: {
    summary: 'RAID Array is degraded',
    // Double-quoted so the single quotes around the device name are literal
    // characters rather than string terminators.
    description: "RAID array '{{ $labels.device }}' on {{ $labels.instance }} is in degraded state due to one or more disks failures. Number of spare drives is insufficient to fix issue automatically.",
  },
},
265+
{
  // Warning alert: at least one member disk of an md array is reported as
  // failed. There is no 'for' clause, so it fires on the first evaluation
  // that sees a failed disk.
  alert: 'NodeRAIDDiskFailure',
  // The node_exporter mdadm collector labels failed member disks with
  // state="failed"; a selector on state="fail" would match no series.
  expr: |||
    node_md_disks{state="failed"} > 0
  ||| % $._config,
  labels: {
    severity: 'warning',
  },
  annotations: {
    summary: 'Failed device in RAID array',
    // Double-quoted so the single quotes around the device name are literal
    // characters rather than string terminators.
    description: "At least one device in RAID array on {{ $labels.instance }} failed. Array '{{ $labels.device }}' needs attention and possibly a disk swap.",
  },
},
251278
],
252279
},
253280
],

0 commit comments

Comments
 (0)