Skip to content

Commit

Permalink
clusterconf/monitor: add rule for stalled lxcfs loadavg
Browse files Browse the repository at this point in the history
  • Loading branch information
aither64 committed Jul 1, 2023
1 parent f07fc16 commit 936e0e3
Showing 1 changed file with 20 additions and 0 deletions.
20 changes: 20 additions & 0 deletions modules/clusterconf/monitor/rules/nodes.nix
Original file line number Diff line number Diff line change
Expand Up @@ -861,6 +861,26 @@
'';
};
}

# Alert rule "LxcfsLoadavgStalled": flags instances whose summed container
# 1-minute load average is not changing, taken as a sign that LXCFS loadavg
# has stopped updating.
{
alert = "LxcfsLoadavgStalled";
# Compares, per instance, the sum of osctl_container_load1 (series with
# job="nodes", role="hypervisor") against the same sum taken 1 minute earlier.
# The expression yields a result only when the two sums are exactly equal.
# NOTE(review): equality also holds when the sum is legitimately constant
# (e.g. every container reports the same load on both samples, or all are 0)
# -- confirm this cannot happen on a healthy hypervisor.
expr = ''sum by (instance) (osctl_container_load1{job="nodes",role="hypervisor"}) == sum by (instance) (osctl_container_load1{job="nodes",role="hypervisor"} offset 1m)'';
# The equality has to hold for this long before the alert fires
# (presumably standard Prometheus `for` semantics -- confirm against the
# code that renders these rules).
for = "5m";
labels = {
alertclass = "lxcfs_loadavg";
severity = "critical";
# NOTE(review): the consumer of `frequency` is not visible here; presumably
# a notification repeat interval -- verify against the alerting config.
frequency = "15m";
};
# Notification text; {{ $labels... }} and {{ $value }} are template
# placeholders left for the alerting system to fill in.
annotations = {
summary = "LXCFS loadavg is not updating (instance {{ $labels.instance }})";
description = ''
LXCFS loadavg is not updating
VALUE = {{ $value }}
LABELS: {{ $labels }}
'';
};
}
];
}

Expand Down

0 comments on commit 936e0e3

Please sign in to comment.