Add harmonia alerting rule
Some checks failed
Run nix flake check / flake-check (push) Has been cancelled
Some checks failed
Run nix flake check / flake-check (push) Has been cancelled
This commit is contained in:
parent
3fde3bf757
commit
0dbdee65c5
@ -147,6 +147,14 @@
|
|||||||
annotations:
|
annotations:
|
||||||
summary: "The build-flakes service on {{ $labels.instance }} has failed"
|
summary: "The build-flakes service on {{ $labels.instance }} has failed"
|
||||||
description: "The build-flakes service on {{ $labels.instance }} has failed"
|
description: "The build-flakes service on {{ $labels.instance }} has failed"
|
||||||
|
- alert: harmonia_down
|
||||||
|
expr: node_systemd_unit_state {instance="nix-cache01.home.2rjus.net:9100", name = "harmonia.service", state = "active"} == 0
|
||||||
|
for: 5m
|
||||||
|
labels:
|
||||||
|
severity: critical
|
||||||
|
annotations:
|
||||||
|
summary: "Harmonia not running on {{ $labels.instance }}"
|
||||||
|
description: "Harmonia has been down on {{ $labels.instance }} for more than 5 minutes."
|
||||||
- alert: low_disk_space_nix
|
- alert: low_disk_space_nix
|
||||||
expr: node_filesystem_free_bytes{instance="nix-cache01.home.2rjus.net:9100", mountpoint="/nix"} / node_filesystem_size_bytes{instance="nix-cache01.home.2rjus.net:9100", mountpoint="/nix"} * 100 < 10
|
expr: node_filesystem_free_bytes{instance="nix-cache01.home.2rjus.net:9100", mountpoint="/nix"} / node_filesystem_size_bytes{instance="nix-cache01.home.2rjus.net:9100", mountpoint="/nix"} * 100 < 10
|
||||||
for: 5m
|
for: 5m
|
||||||
|
Loading…
x
Reference in New Issue
Block a user