|
/etc/alerts.d/node_alerting_rules.yml > container_cpu_usage_is_high
|
| Labels | State | Active Since | Value |
|---|---|---|---|
| alertname="POD_CPU_IS_HIGH" container="alpha" namespace="ssd-june" pod="dgraph-0" severity="critical" | firing | 2025-12-06 11:01:39.87619941 +0000 UTC | 415.44198955904835 |

Annotations:
- description: Container alpha CPU usage inside POD dgraph-0 is high in ssd-june
- summary: POD dgraph-0 CPU Usage is high in ssd-june
|
|
|
/etc/alerts.d/node_alerting_rules.yml > container_memory_usage_is_high
|
| Labels | State | Active Since | Value |
|---|---|---|---|
| alertname="POD_MEMORY_USAGE_IS_HIGH" container="minio" namespace="redica-sep" pod="ssd-minio-6d9ddbcc9b-lnc6d" severity="critical" | firing | 2025-12-01 18:14:29.308708883 +0000 UTC | 90.24861653645834 |

Annotations:
- description: Container Memory usage is above 80%
  VALUE = 90.24861653645834
  LABELS = map[container:minio namespace:redica-sep pod:ssd-minio-6d9ddbcc9b-lnc6d]
- summary: Container minio Memory usage inside POD ssd-minio-6d9ddbcc9b-lnc6d is high in redica-sep
|
|
| Labels | State | Active Since | Value |
|---|---|---|---|
| alertname="POD_MEMORY_USAGE_IS_HIGH" container="minio" namespace="ssd-june" pod="ssd-minio-6d9ddbcc9b-46lw8" severity="critical" | firing | 2025-11-02 11:11:29.308708883 +0000 UTC | 96.99605305989584 |

Annotations:
- description: Container Memory usage is above 80%
  VALUE = 96.99605305989584
  LABELS = map[container:minio namespace:ssd-june pod:ssd-minio-6d9ddbcc9b-46lw8]
- summary: Container minio Memory usage inside POD ssd-minio-6d9ddbcc9b-46lw8 is high in ssd-june
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_cpu_greater_than_80
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_disk_space_too_low
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > node_down
|
# Alerting rule NODE_DOWN: raised with severity "warning" once the expression
# below has held continuously for 3 minutes (`for: 3m`).
alert: NODE_DOWN
# Selects `up` series labelled component="kubernetes-nodes" whose value is 0.
expr: up{component="kubernetes-nodes"} == 0
for: 3m
# `severity` must be nested under `labels`; at the top level it is not a
# rule field and `labels` itself would be left empty.
labels:
  severity: warning
# Both annotations are templates expanded from the firing series' labels.
annotations:
  description: '{{ $labels.job }} job failed to scrape instance {{ $labels.instance }} for more than 3 minutes. Node Seems to be down'
  # NOTE(review): the description uses `job`/`instance`, the summary uses
  # `kubernetes_node` - confirm the matched `up` series actually carries a
  # `kubernetes_node` label, otherwise the node name renders empty.
  summary: 'Node {{ $labels.kubernetes_node }} is down'
|
|
/etc/alerts.d/node_alerting_rules.yml > node_memory_left_lessser_than_10
|
|
|
|
/etc/alerts.d/node_alerting_rules.yml > prometheus-job-down
|
# Alerting rule prometheus-job-down: raised with severity "warning" once the
# expression below has held continuously for 1 minute (`for: 1m`).
alert: prometheus-job-down
# Selects `up` series labelled job="prometheus" whose value is 0.
expr: up{job="prometheus"} == 0
for: 1m
# `severity` must be nested under `labels`; at the top level it is not a
# rule field and `labels` itself would be left empty.
labels:
  severity: warning
# Both annotations are templates; `description` prints the full label set of
# the firing series, `summary` prints only its `job` label.
annotations:
  description: 'Default Prometheus Job is Down LABELS = {{ $labels }}'
  summary: 'The Default Prometheus Job is Down (job {{ $labels.job}})'
|