|
/etc/prometheus/alerts/alert_healthchecks.yml > Selfmonitoring
|
| Labels |
State |
Active Since |
Value |
|
alertname="SelfMonitoringAlwaysFiring"
application="leonard_healthchecks"
severity="info"
|
firing |
2025-09-18 19:15:46.797458603 +0000 UTC |
13 |
|
|
/etc/prometheus/alerts/alert_loadbalancing.yml > lowpref
|
| Labels |
State |
Active Since |
Value |
|
alertname="LowGatewayPreference"
instance="gw06n01"
job="json_gwpref"
segment="1"
severity="page"
|
pending |
2025-12-10 11:33:10.619007883 +0000 UTC |
-48 |
| Annotations |
- summary
- has low gateway preference (-48)
|
|
alertname="LowGatewayPreference"
instance="gw04n06"
job="json_gwpref"
segment="1"
severity="page"
|
pending |
2025-12-10 15:45:25.619007883 +0000 UTC |
5 |
| Annotations |
- summary
- has low gateway preference (5)
|
|
|
/etc/prometheus/alerts/blackbox-exporter.yml > BlackboxExporter
|
alert: BlackboxProbeFailed
expr: probe_success
== 0
for: 15m
labels:
severity: critical
annotations:
description: |-
Probe failed
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Blackbox probe failed (instance {{ $labels.instance }})
| Labels |
State |
Active Since |
Value |
|
alertname="BlackboxProbeFailed"
instance="https://freifunk-router-ist-veraltet.de"
job="blackbox_tls"
severity="critical"
|
pending |
2025-12-10 17:13:16.497484307 +0000 UTC |
0 |
| Annotations |
- description
- Probe failed
VALUE = 0
LABELS = map[__name__:probe_success instance:https://freifunk-router-ist-veraltet.de job:blackbox_tls]
- summary
- Blackbox probe failed (instance https://freifunk-router-ist-veraltet.de)
|
|
alertname="BlackboxProbeFailed"
instance="https://maillist.freifunk-stuttgart.de"
job="blackbox_tls"
severity="critical"
|
pending |
2025-12-10 17:11:46.497484307 +0000 UTC |
0 |
| Annotations |
- description
- Probe failed
VALUE = 0
LABELS = map[__name__:probe_success instance:https://maillist.freifunk-stuttgart.de job:blackbox_tls]
- summary
- Blackbox probe failed (instance https://maillist.freifunk-stuttgart.de)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/alerts/general.yml > general
|
| Labels |
State |
Active Since |
Value |
|
alertname="PROBE_FAILED_TCP"
instance="https://freifunk-router-ist-veraltet.de"
job="blackbox_tls"
severity="warning"
|
pending |
2025-12-10 17:13:18.333717053 +0000 UTC |
0 |
| Annotations |
- summary
- Blackbox probe failed
|
|
alertname="PROBE_FAILED_TCP"
instance="https://maillist.freifunk-stuttgart.de"
job="blackbox_tls"
severity="warning"
|
pending |
2025-12-10 17:11:48.333717053 +0000 UTC |
0 |
| Annotations |
- summary
- Blackbox probe failed
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/alerts/node-exporter.yml > NodeExporter
|
| Labels |
State |
Active Since |
Value |
|
alertname="HostRequiresReboot"
instance="ffs13"
job="node"
nodename="ffs13"
severity="info"
|
firing |
2025-10-28 05:48:02.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs13 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs13 job:node nodename:ffs13]
- summary
- Host requires reboot (instance ffs13)
|
|
alertname="HostRequiresReboot"
instance="ffs10"
job="node"
nodename="ffs10"
severity="info"
|
firing |
2025-11-18 05:15:02.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs10 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs10 job:node nodename:ffs10]
- summary
- Host requires reboot (instance ffs10)
|
|
alertname="HostRequiresReboot"
instance="prometheus01"
job="node"
nodename="prometheus01"
severity="info"
|
firing |
2025-11-20 20:44:17.079934382 +0000 UTC |
1 |
| Annotations |
- description
- prometheus01 requires a reboot.
VALUE = 1
LABELS = map[instance:prometheus01 job:node nodename:prometheus01]
- summary
- Host requires reboot (instance prometheus01)
|
|
alertname="HostRequiresReboot"
instance="ffs14"
job="node"
nodename="ffs14"
severity="info"
|
firing |
2025-11-13 05:19:32.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs14 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs14 job:node nodename:ffs14]
- summary
- Host requires reboot (instance ffs14)
|
|
alertname="HostRequiresReboot"
instance="monitor02"
job="node"
nodename="monitor02"
severity="info"
|
firing |
2025-11-13 05:31:32.079934382 +0000 UTC |
1 |
| Annotations |
- description
- monitor02 requires a reboot.
VALUE = 1
LABELS = map[instance:monitor02 job:node nodename:monitor02]
- summary
- Host requires reboot (instance monitor02)
|
|
alertname="HostRequiresReboot"
instance="monitor01"
job="node"
nodename="monitor01"
severity="info"
|
firing |
2025-11-13 06:06:17.079934382 +0000 UTC |
1 |
| Annotations |
- description
- monitor01 requires a reboot.
VALUE = 1
LABELS = map[instance:monitor01 job:node nodename:monitor01]
- summary
- Host requires reboot (instance monitor01)
|
|
alertname="HostRequiresReboot"
instance="ffs11"
job="node"
nodename="ffs11"
severity="info"
|
firing |
2025-11-26 06:35:32.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs11 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs11 job:node nodename:ffs11]
- summary
- Host requires reboot (instance ffs11)
|
|
alertname="HostRequiresReboot"
instance="ffs08"
job="node"
nodename="ffs08"
severity="info"
|
firing |
2025-10-28 05:33:02.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs08 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs08 job:node nodename:ffs08]
- summary
- Host requires reboot (instance ffs08)
|
|
alertname="HostRequiresReboot"
instance="ffs05"
job="node"
nodename="ffs05"
severity="info"
|
firing |
2025-11-02 14:18:02.079934382 +0000 UTC |
1 |
| Annotations |
- description
- ffs05 requires a reboot.
VALUE = 1
LABELS = map[instance:ffs05 job:node nodename:ffs05]
- summary
- Host requires reboot (instance ffs05)
|
|
alertname="HostRequiresReboot"
instance="gw04n05"
job="node"
nodename="gw04n05"
severity="info"
|
firing |
2025-12-09 08:54:32.079934382 +0000 UTC |
1 |
| Annotations |
- description
- gw04n05 requires a reboot.
VALUE = 1
LABELS = map[instance:gw04n05 job:node nodename:gw04n05]
- summary
- Host requires reboot (instance gw04n05)
|
|
alertname="HostRequiresReboot"
instance="gw09n04"
job="node"
nodename="gw09n04"
severity="info"
|
firing |
2025-11-13 05:59:02.079934382 +0000 UTC |
1 |
| Annotations |
- description
- gw09n04 requires a reboot.
VALUE = 1
LABELS = map[instance:gw09n04 job:node nodename:gw09n04]
- summary
- Host requires reboot (instance gw09n04)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
alert: HostFilesystemDeviceError
expr: node_filesystem_device_error
== 1
for: 2m
labels:
severity: critical
annotations:
description: |-
{{ $labels.instance }}: Device error with the {{ $labels.mountpoint }} filesystem
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Host filesystem device error (instance {{ $labels.instance }})
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/alerts/postfix.yml > postfix_smtp_status_deferred
|
|
|
|
/etc/prometheus/alerts/pve.yml > pve-guest-alerts
|
|
|
|
|
|
/etc/prometheus/alerts/smartctl-exporter.yml > SmartctlExporter
|
alert: SmartCriticalWarning
expr: smartctl_device_critical_warning
> 0
for: 15m
labels:
severity: critical
annotations:
description: |-
device has critical warning (instance {{ $labels.instance }})
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Smart critical warning (instance {{ $labels.instance }})
|
alert: SmartDeviceTemperatureCritical
expr: smartctl_device_temperature
> 80
for: 2m
labels:
severity: critical
annotations:
description: |-
Device temperature critical (instance {{ $labels.instance }})
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Smart device temperature critical (instance {{ $labels.instance }})
|
alert: SmartDeviceTemperatureWarning
expr: smartctl_device_temperature
> 60
for: 2m
labels:
severity: warning
annotations:
description: |-
Device temperature warning (instance {{ $labels.instance }})
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Smart device temperature warning (instance {{ $labels.instance }})
|
alert: SmartMediaErrors
expr: smartctl_device_media_errors
> 0
for: 15m
labels:
severity: critical
annotations:
description: |-
device has media errors (instance {{ $labels.instance }})
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Smart media errors (instance {{ $labels.instance }})
|
|
|