|
/etc/prometheus/rules/mail_alerts.yml > mail
|
|
|
|
|
# Critical-severity rule for the postfix service: fires once
# node_postfix_queue_size has stayed above 200 for 5 minutes.
alert: PostfixMailQueueCritical
# Comparison kept on one line; a continuation at column 0 is not part of
# a plain scalar.
expr: node_postfix_queue_size > 200
for: 5m
# Labels attached to the alert.
labels:
  service: postfix
  severity: critical
# Templated text; quoted so the values are always read as strings.
annotations:
  description: 'Mail queue has {{ $value }} messages — possible delivery failure'
  summary: 'Postfix mail queue critical on {{ $labels.instance }}'
|
# Warning-severity rule for the postfix service: fires once
# node_postfix_queue_size has stayed above 50 for 15 minutes.
alert: PostfixMailQueueGrowing
# Comparison kept on one line; a continuation at column 0 is not part of
# a plain scalar.
expr: node_postfix_queue_size > 50
for: 15m
# Labels attached to the alert.
labels:
  service: postfix
  severity: warning
# Templated text; the description must stay quoted because it contains ": ".
annotations:
  description: 'Mail queue has {{ $value }} messages (threshold: 50)'
  summary: 'Postfix mail queue growing on {{ $labels.instance }}'
|
|
/etc/prometheus/rules/system_alerts.yml > system
|
| Labels | State | Active Since | Value |
|
alertname="DiskSpaceWarning"
device="/dev/sda1"
fstype="ext4"
instance="durufprocgas.com"
job="node"
mountpoint="/"
severity="warning"
|
firing |
2026-05-07 05:23:17.865744121 +0000 UTC |
84.60164854729237 |
| Annotations |
- description
- Disk / is 84.6% full
- summary
- Disk space warning on durufprocgas.com
|
|
alertname="DiskSpaceWarning"
device="/dev/sdb"
fstype="ext4"
instance="durufprocgas.com"
job="node"
mountpoint="/backup"
severity="warning"
|
firing |
2026-05-07 05:23:17.865744121 +0000 UTC |
86.2368198448894 |
| Annotations |
- description
- Disk /backup is 86.2% full
- summary
- Disk space warning on durufprocgas.com
|
|
| Labels | State | Active Since | Value |
|
alertname="SystemdServiceFailed"
instance="durufprocgas.com"
job="node"
name="certbot.service"
severity="warning"
state="failed"
type="oneshot"
|
firing |
2026-05-09 12:35:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service certbot.service is in failed state
- summary
- Systemd service failed on durufprocgas.com
|
|
alertname="SystemdServiceFailed"
instance="durufprocgas.com"
job="node"
name="logrotate.service"
severity="warning"
state="failed"
type="oneshot"
|
firing |
2026-05-07 05:23:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service logrotate.service is in failed state
- summary
- Systemd service failed on durufprocgas.com
|
|
alertname="SystemdServiceFailed"
instance="durufprocgas.com"
job="node"
name="maldet.service"
severity="warning"
state="failed"
type="forking"
|
firing |
2026-05-08 06:29:47.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service maldet.service is in failed state
- summary
- Systemd service failed on durufprocgas.com
|
|
alertname="SystemdServiceFailed"
instance="durufprocgas.com"
job="node"
name="openipmi.service"
severity="warning"
state="failed"
type="forking"
|
firing |
2026-05-07 05:23:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service openipmi.service is in failed state
- summary
- Systemd service failed on durufprocgas.com
|
|
alertname="SystemdServiceFailed"
instance="durufprocgas.com"
job="node"
name="spamd.service"
severity="warning"
state="failed"
type="simple"
|
firing |
2026-05-07 05:23:17.865744121 +0000 UTC |
1 |
| Annotations |
- description
- Service spamd.service is in failed state
- summary
- Systemd service failed on durufprocgas.com
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Critical-severity rule: fires once `up == 0` has held for 1 minute.
alert: ServerDown
expr: up == 0
for: 1m
# Labels attached to the alert.
labels:
  severity: critical
# Templated text; the description starts with "{{", so it must be quoted
# to avoid being parsed as a flow mapping.
annotations:
  # The quoted scalar spans two lines; the line break folds to one space.
  description: '{{ $labels.instance }} ({{ $labels.job }}) has been unreachable for
    more than 1 minute'
  summary: 'Instance {{ $labels.instance }} is down'
|
|
|
|
/etc/prometheus/rules/web_alerts.yml > web
|
|
|
|
|
|
|
|
|