|
/etc/alerts.d/node_alerting_rules.yml > container_cpu_usage_is_high
|
| Labels |
State |
Active Since |
Value |
|
alertname="POD_CPU_IS_HIGH"
container="alpha"
namespace="redica-sep-final"
pod="dgraph-0"
severity="critical"
|
firing |
2026-01-30 02:51:39.87619941 +0000 UTC |
143.80444667364236 |
| Annotations |
- description
- Container alpha CPU usage inside POD dgraph-0 is high in redica-sep-final
- summary
- POD dgraph-0 CPU Usage is high in redica-sep-final
|
|
alertname="POD_CPU_IS_HIGH"
container="alpha"
namespace="nov-striim"
pod="dgraph-0"
severity="critical"
|
firing |
2026-01-30 02:09:39.87619941 +0000 UTC |
98.73926583427757 |
| Annotations |
- description
- Container alpha CPU usage inside POD dgraph-0 is high in nov-striim
- summary
- POD dgraph-0 CPU Usage is high in nov-striim
|
|
|
/etc/alerts.d/node_alerting_rules.yml > container_memory_usage_is_high
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_cpu_greater_than_80
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_disk_space_too_low
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_down
|
# NODE_DOWN: raised when a series selected by component="kubernetes-nodes"
# has reported up == 0 continuously for the `for` window below.
alert: NODE_DOWN
expr: up{component="kubernetes-nodes"} == 0
# Condition must hold for 3 minutes before the alert fires; the description
# text below repeats this duration, so keep the two in sync.
for: 3m
labels:
  severity: warning
annotations:
  description: '{{ $labels.job }} job failed to scrape instance {{ $labels.instance }} for more than 3 minutes. Node Seems to be down'
  # NOTE(review): assumes the selected `up` series carry a `kubernetes_node`
  # label (it is not visible here) - confirm, otherwise this renders empty.
  summary: 'Node {{ $labels.kubernetes_node }} is down'
|
|
/etc/alerts.d/node_alerting_rules.yml > node_memory_left_lessser_than_10
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > prometheus-job-down
|
# prometheus-job-down: raised when a series with job="prometheus" has
# reported up == 0 continuously for the `for` window below.
alert: prometheus-job-down
expr: up{job="prometheus"} == 0
# Condition must hold for 1 minute before the alert fires.
for: 1m
labels:
  severity: warning
annotations:
  # Templated values are quoted so they are always read as plain strings.
  description: 'Default Prometheus Job is Down LABELS = {{ $labels }}'
  summary: 'The Default Prometheus Job is Down (job {{ $labels.job}})'
|