|
/etc/prometheus/rules/mail_alerts.yml > mail
|
|
|
|
|
alert: PostfixMailQueueCritical
expr: node_postfix_queue_size
> 200
for: 5m
labels:
service: postfix
severity: critical
annotations:
description: Mail queue has {{ $value }} messages — possible delivery failure
summary: Postfix mail queue critical on {{ $labels.instance }}
|
alert: PostfixMailQueueGrowing
expr: node_postfix_queue_size
> 50
for: 15m
labels:
service: postfix
severity: warning
annotations:
description: 'Mail queue has {{ $value }} messages (threshold: 50)'
summary: Postfix mail queue growing on {{ $labels.instance }}
|
|
/etc/prometheus/rules/system_alerts.yml > system
|
| Labels |
State |
Active Since |
Value |
|
alertname="DiskSpaceCritical"
device="/dev/sda1"
fstype="ext4"
instance="zagaavipato.services"
job="node"
mountpoint="/"
severity="critical"
|
firing |
2026-06-18 08:00:17.865744121 +0000 UTC |
90.41471283834152 |
| Annotations |
- description
- Disk / is 90.4% full
- summary
- Critical disk space on zagaavipato.services
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="DiskSpaceWarning"
device="/dev/sda1"
fstype="ext4"
instance="zagaavipato.services"
job="node"
mountpoint="/"
severity="warning"
|
firing |
2026-06-05 09:57:17.865744121 +0000 UTC |
90.41471283834152 |
| Annotations |
- description
- Disk / is 90.4% full
- summary
- Disk space warning on zagaavipato.services
|
|
alertname="DiskSpaceWarning"
device="/dev/sdc"
fstype="ext4"
instance="zagaavipato.services"
job="node"
mountpoint="/backup"
severity="warning"
|
firing |
2026-06-05 09:57:17.865744121 +0000 UTC |
87.35526798855075 |
| Annotations |
- description
- Disk /backup is 87.4% full
- summary
- Disk space warning on zagaavipato.services
|
|
alert: ServerDown
expr: up == 0
for: 1m
labels:
severity: critical
annotations:
description: '{{ $labels.instance }} ({{ $labels.job }}) has been unreachable for
more than 1 minute'
summary: Instance {{ $labels.instance }} is down
| Labels |
State |
Active Since |
Value |
|
alertname="ServerDown"
instance="localhost:9093"
job="alertmanager"
severity="critical"
|
firing |
2026-06-05 09:57:17.865744121 +0000 UTC |
0 |
| Annotations |
- description
- localhost:9093 (alertmanager) has been unreachable for more than 1 minute
- summary
- Instance localhost:9093 is down
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="SystemdServiceFailed"
instance="zagaavipato.services"
job="node"
name="prometheus-alertmanager.service"
severity="warning"
state="failed"
type="simple"
|
firing |
2026-06-05 09:57:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service prometheus-alertmanager.service is in failed state
- summary
- Systemd service failed on zagaavipato.services
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/rules/web_alerts.yml > web
|
|
|
|
|
|
|
|
|