|
/etc/prometheus/alert.rules > containers
|
| Labels |
State |
Active Since |
Value |
|
alertname="caddy_down"
severity="critical"
|
firing |
2026-02-15 23:12:06.11869088 +0000 UTC |
1 |
| Annotations |
- description
- Caddy container is down for more than 30 seconds.
- summary
- Caddy down
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="graphnode_down"
severity="critical"
|
firing |
2026-02-15 23:12:06.11869088 +0000 UTC |
1 |
| Annotations |
- description
- Graph Node container is down for more than 30 seconds.
- summary
- Graph Node down
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="postgres_down"
severity="critical"
|
firing |
2026-02-15 23:12:06.11869088 +0000 UTC |
1 |
| Annotations |
- description
- Postgres container is down for more than 30 seconds.
- summary
- Postgres down
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/etc/prometheus/alert.rules > host
|
alert: high_cpu_load
expr: node_load1 > 1.5
for: 30s
labels:
  severity: warning
annotations:
  description: Docker host is under high load, the avg load 1m is at {{ $value}}. Reported by instance {{ $labels.instance }} of job {{ $labels.job }}.
  summary: Server under high load
|
|
|
|
|
|
/etc/prometheus/alert.rules > targets
|
alert: monitor_service_down
expr: up == 0
for: 30s
labels:
  severity: critical
annotations:
  description: Service {{ $labels.instance }} is down.
  summary: Monitor service non-operational
| Labels |
State |
Active Since |
Value |
|
alertname="monitor_service_down"
instance="query-node-3:8040"
job="query-node-3"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service query-node-3:8040 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="pushgateway-l2:9091"
job="pushgateway-l2"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service pushgateway-l2:9091 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="query-node-4:8040"
job="query-node-4"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service query-node-4:8040 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="indexer-service-l2-0:7300"
job="indexer-service-l2-0"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service indexer-service-l2-0:7300 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="indexer-service-l2-1:7300"
job="indexer-service-l2-1"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service indexer-service-l2-1:7300 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="indexer-service-l2-2:7300"
job="indexer-service-l2-2"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service indexer-service-l2-2:7300 is down.
- summary
- Monitor service non-operational
|
|
alertname="monitor_service_down"
instance="nodeexporter:9100"
job="nodeexporter-l2"
severity="critical"
|
firing |
2026-02-15 23:12:02.878296715 +0000 UTC |
0 |
| Annotations |
- description
- Service nodeexporter:9100 is down.
- summary
- Monitor service non-operational
|
|