|
/etc/prometheus/rules/mail_alerts.yml > mail
|
|
|
|
|
alert: PostfixMailQueueCritical
expr: node_postfix_queue_size
> 200
for: 5m
labels:
service: postfix
severity: critical
annotations:
description: Mail queue has {{ $value }} messages — possible delivery failure
summary: Postfix mail queue critical on {{ $labels.instance }}
|
alert: PostfixMailQueueGrowing
expr: node_postfix_queue_size
> 50
for: 15m
labels:
service: postfix
severity: warning
annotations:
description: 'Mail queue has {{ $value }} messages (threshold: 50)'
summary: Postfix mail queue growing on {{ $labels.instance }}
|
|
/etc/prometheus/rules/system_alerts.yml > system
|
alert: ServerDown
expr: up == 0
for: 1m
labels:
severity: critical
annotations:
description: '{{ $labels.instance }} ({{ $labels.job }}) has been unreachable for
more than 1 minute'
summary: Instance {{ $labels.instance }} is down
| Labels |
State |
Active Since |
Value |
|
alertname="ServerDown"
instance="localhost:9093"
job="alertmanager"
severity="critical"
|
firing |
2026-04-28 18:46:47.865744121 +0000 UTC |
0 |
| Annotations |
- description
- localhost:9093 (alertmanager) has been unreachable for more than 1 minute
- summary
- Instance localhost:9093 is down
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="SystemdServiceFailed"
instance="mwaponda.com"
job="node"
name="prometheus-alertmanager.service"
severity="warning"
state="failed"
type="simple"
|
firing |
2026-04-28 18:46:47.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service prometheus-alertmanager.service is in failed state
- summary
- Systemd service failed on mwaponda.com
|
|
alertname="SystemdServiceFailed"
instance="mwaponda.com"
job="node"
name="openipmi.service"
severity="warning"
state="failed"
type="forking"
|
firing |
2026-04-28 18:47:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service openipmi.service is in failed state
- summary
- Systemd service failed on mwaponda.com
|
|
alertname="SystemdServiceFailed"
instance="mwaponda.com"
job="node"
name="logrotate.service"
severity="warning"
state="failed"
type="oneshot"
|
firing |
2026-04-29 00:00:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service logrotate.service is in failed state
- summary
- Systemd service failed on mwaponda.com
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/rules/web_alerts.yml > web
|
|
|
|
|
|
|
|
|