|
/etc/config/alerting_rules.yml > BlackBox Alerts
|
|
|
|
|
|
/etc/config/alerting_rules.yml > MSSQL Alerts
|
| Labels |
State |
Active Since |
Value |
|
alertname="HostHighCpuLoad"
instance="10.0.7.37:9100"
severity="warning"
|
firing |
2025-12-10 08:42:46.936640537 +0000 UTC |
97.78809523808637 |
| Annotations |
- description
- CPU load is > 80%
VALUE = 97.78809523808637
LABELS = map[instance:10.0.7.37:9100]
- summary
- Host high CPU load (instance )
|
|
| Labels |
State |
Active Since |
Value |
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="ingress-nginx-controller-6fcfb6b495-rfsm4"
severity="critical"
|
firing |
2025-11-18 00:12:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:ingress-nginx-controller-6fcfb6b495-rfsm4]
- summary
- Kubernetes Pod not healthy (instance ingress-nginx-controller-6fcfb6b495-rfsm4)
|
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="ingress-nginx-controller-6fcfb6b495-njd4k"
severity="critical"
|
firing |
2025-11-25 15:36:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:ingress-nginx-controller-6fcfb6b495-njd4k]
- summary
- Kubernetes Pod not healthy (instance ingress-nginx-controller-6fcfb6b495-njd4k)
|
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="job-licensestatuscheck-0.0.9.228.0-8z2zh"
severity="critical"
|
firing |
2025-12-10 00:18:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:job-licensestatuscheck-0.0.9.228.0-8z2zh]
- summary
- Kubernetes Pod not healthy (instance job-licensestatuscheck-0.0.9.228.0-8z2zh)
|
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="ingress-nginx-controller-6fcfb6b495-kfdjt"
severity="critical"
|
firing |
2025-11-25 15:22:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:ingress-nginx-controller-6fcfb6b495-kfdjt]
- summary
- Kubernetes Pod not healthy (instance ingress-nginx-controller-6fcfb6b495-kfdjt)
|
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="ingress-nginx-controller-6fcfb6b495-gj7lz"
severity="critical"
|
firing |
2025-11-10 18:36:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:ingress-nginx-controller-6fcfb6b495-gj7lz]
- summary
- Kubernetes Pod not healthy (instance ingress-nginx-controller-6fcfb6b495-gj7lz)
|
|
alertname="KubernetesPodNotHealthy"
namespace="p433"
pod="ingress-nginx-controller-6fcfb6b495-z95rj"
severity="critical"
|
firing |
2025-12-03 21:59:46.936640537 +0000 UTC |
1 |
| Annotations |
- description
- Pod has been in a non-ready state for longer than 15 minutes.
VALUE = 1
LABELS = map[namespace:p433 pod:ingress-nginx-controller-6fcfb6b495-z95rj]
- summary
- Kubernetes Pod not healthy (instance ingress-nginx-controller-6fcfb6b495-z95rj)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Alerting rule: fires when the ratio of available to total bytes reported for
# a volume stays below 10% for two minutes.
alert: KubernetesVolumeOutOfDiskSpace
# `sum without(...)` aggregates away the listed labels so they do not appear on
# the resulting alert; every other label on the series is kept. The comparison
# `< 10` acts as a filter, so only volumes under the threshold produce a sample.
expr: >-
  sum without(beta_kubernetes_io_arch, beta_kubernetes_io_instance_type,
  failure_domain_beta_kubernetes_io_region, kubernetes_azure_com_cluster,
  kubernetes_azure_com_node_image_version, kubernetes_azure_com_role,
  kubernetes_io_arch, kubernetes_io_hostname, kubernetes_io_os,
  kubernetes_io_role, node_kubernetes_io_instance_type,
  topology_kubernetes_io_region, topology_kubernetes_io_zone,
  failure_domain_beta_kubernetes_io_zone)
  (kubelet_volume_stats_available_bytes / kubelet_volume_stats_capacity_bytes * 100 < 10)
# The condition must hold continuously for this long before the alert fires.
for: 2m
labels:
  severity: warning
annotations:
  # `|-` keeps the line breaks and strips the trailing newline.
  description: |-
    Volume is almost full (< 10% left)
    VALUE = {{ $value }}
    LABELS = {{ $labels }}
  # The kubelet volume stats series are identified by `namespace` and
  # `persistentvolumeclaim`; they carry no `pod` label, so the previous
  # `{{ $labels.pod }}` rendered as an empty string.
  # NOTE(review): confirm no scrape relabeling adds a `pod` label here.
  summary: Kubernetes Volume out of disk space (instance {{ $labels.namespace }}/{{ $labels.persistentvolumeclaim }})
|
|
|
|
|
|
|