diff --git a/hosts/monitoring-3/rules.yml b/hosts/monitoring-3/rules.yml index 26d45b2..95ed038 100644 --- a/hosts/monitoring-3/rules.yml +++ b/hosts/monitoring-3/rules.yml @@ -9,13 +9,6 @@ groups: annotations: summary: "Endpoint {{ $labels.instance }} down" description: "{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 1 minutes." - - alert: InstanceUptime - expr: time() - node_boot_time_seconds{job="node-exporter"} >= 7776000 - labels: - severity: warning - annotations: - summary: "Uptime of {{ $labels.instance }} more than 90 days" - description: "The last reboot of {{ $labels.instance }} was more than 90 days ago" - alert: InstanceConfigNotSync expr: nixos_current_system_is_sync{} == 0 for: 2h @@ -48,3 +41,11 @@ groups: annotations: summary: "Event instance {{ $labels.instance }} down" description: "{{ $labels.instance }} has been down for more than 2 hours." + - alert: KernelChanged + expr: nixos_current_system_kernel_is_booted_system_kernel{job="nixos-exporter"} == 0 + for: 2h + labels: + severity: warning + annotations: + summary: "Kernel of {{ $labels.instance }} changed" + description: "The Kernel {{ $labels.instance }} booted with, isn't the target Kernel. A reboot may be required."