| Rule |
State |
Error |
Last Evaluation |
Evaluation Time |
| alert: MSSQL connectivity alert
expr: up{job="prometheus-mssql-exporter"} == 0
for: 1m
labels:
severity: critical
annotations:
summary: The service {{ $labels.job }} is unreachable or down. Please check the MSSQL server for further information.
|
ok
|
|
16.761s ago
|
312.4us |
| alert: compliance alert
expr: probe_success{job="compliance",namespace!="kube-system"} == 0
labels:
Notification: None
severity: warning
annotations:
summary: The service {{ $labels.job }} compliance is disabled.
|
ok
|
|
16.76s ago
|
123.1us |
| alert: compliance alert
expr: probe_success{job="compliance",namespace!="kube-system"} == 1
labels:
severity: warning
annotations:
summary: The service {{ $labels.job }} compliance is enabled.
|
ok
|
|
16.76s ago
|
111us |
| alert: KubernetesNodeReady
expr: kube_node_status_condition{condition="Ready",namespace!="kube-system",status="true"} == 0
for: 10m
labels:
severity: critical
annotations:
description: |-
Node {{ $labels.node }} has been unready for a long time
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes Node not ready (instance {{ $labels.pod }})
|
ok
|
|
16.76s ago
|
197.3us |
| alert: KubernetesMemoryPressure
expr: kube_node_status_condition{condition="MemoryPressure",namespace!="kube-system",status="true"} == 1
for: 2m
labels:
severity: critical
annotations:
description: |-
{{ $labels.node }} has MemoryPressure condition
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes memory pressure (instance {{ $labels.pod }})
|
ok
|
|
16.76s ago
|
169.3us |
| alert: KubernetesDiskPressure
expr: kube_node_status_condition{condition="DiskPressure",namespace!="kube-system",status="true"} == 1
for: 2m
labels:
severity: critical
annotations:
description: |-
{{ $labels.node }} has DiskPressure condition
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes disk pressure (instance {{ $labels.pod }})
|
ok
|
|
16.76s ago
|
157.7us |
| alert: KubernetesOutOfDisk
expr: kube_node_status_condition{condition="OutOfDisk",namespace!="kube-system",status="true"} == 1
for: 2m
labels:
severity: critical
annotations:
description: |-
{{ $labels.node }} has OutOfDisk condition
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes out of disk (instance {{ $labels.pod }})
|
ok
|
|
16.76s ago
|
103.4us |
| alert: KubernetesOutOfCapacity
expr: sum by(node) ((kube_pod_status_phase{namespace!="kube-system",phase="Running"} == 1) + on(pod, namespace) group_left(node) (0 * kube_pod_info)) / sum by(node) (kube_node_status_allocatable_pods{namespace!="kube-system"}) * 100 > 90
for: 2m
labels:
severity: warning
annotations:
description: |-
{{ $labels.node }} is out of capacity
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes out of capacity (instance {{ $labels.pod }})
|
ok
|
|
16.762s ago
|
3.806ms |
| alert: KubernetesPersistentvolumeclaimPending
expr: kube_persistentvolumeclaim_status_phase{namespace!="kube-system",phase="Pending"} == 1
for: 2m
labels:
severity: warning
annotations:
description: |-
PersistentVolumeClaim {{ $labels.namespace }}/{{ $labels.persistentvolumeclaim }} is pending
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes PersistentVolumeClaim pending (instance {{ $labels.pod }})
|
ok
|
|
16.758s ago
|
414.9us |
| alert: KubernetesVolumeOutOfDiskSpace
expr: sum without(beta_kubernetes_io_arch, beta_kubernetes_io_instance_type, failure_domain_beta_kubernetes_io_region, kubernetes_azure_com_cluster, kubernetes_azure_com_node_image_version, kubernetes_azure_com_role, kubernetes_io_arch, kubernetes_io_hostname, kubernetes_io_os, kubernetes_io_role, node_kubernetes_io_instance_type, topology_kubernetes_io_region, topology_kubernetes_io_zone, failure_domain_beta_kubernetes_io_zone) (kubelet_volume_stats_available_bytes / kubelet_volume_stats_capacity_bytes * 100 < 10)
for: 2m
labels:
severity: warning
annotations:
description: |-
Volume is almost full (< 10% left)
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes Volume out of disk space (instance {{ $labels.pod }})
|
ok
|
|
16.758s ago
|
194.9us |
| alert: KubernetesPersistentvolumeError
expr: kube_persistentvolume_status_phase{job="kube-state-metrics",namespace!="kube-system",phase=~"Failed|Pending"} > 0
labels:
severity: critical
annotations:
description: |-
Persistent volume is in bad state
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes PersistentVolume error (instance {{ $labels.pod }})
|
ok
|
|
16.758s ago
|
691us |
| alert: DatabaseMaintainenceJobCountIncreased
expr: jobcount{job="prometheus-query-exporter"} > 0
for: 1m
annotations:
description: Database Maintenance Job count for database
summary: Database Maintenance Job count for database
|
ok
|
|
16.757s ago
|
81.12us |
| alert: KubernetesPodNotHealthy
expr: min_over_time(sum by(namespace, pod) (kube_pod_status_phase{namespace!="kube-system",phase=~"Pending|Unknown|Failed"})[15m:1m]) > 0
labels:
severity: critical
annotations:
description: |-
Pod has been in a non-ready state for longer than 15 minutes.
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes Pod not healthy (instance {{ $labels.pod }})
|
ok
|
|
16.758s ago
|
6.827ms |
| alert: KubernetesPodCrashLooping
expr: increase(kube_pod_container_status_restarts_total{namespace!="kube-system"}[1m]) > 3
for: 2m
labels:
severity: warning
annotations:
description: |-
Pod {{ $labels.pod }} is crash looping
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Kubernetes pod crash looping (instance {{ $labels.pod }})
|
ok
|
|
16.751s ago
|
1.669ms |
| alert: HostHighCpuLoad
expr: 100 - (avg by(instance) (rate(node_cpu_seconds_total{mode="idle"}[2m])) * 100) > 80
for: 2m
labels:
severity: warning
annotations:
description: |-
CPU load is > 80%
VALUE = {{ $value }}
LABELS = {{ $labels }}
summary: Host high CPU load (instance {{ $labels.pod }})
|
ok
|
|
16.749s ago
|
583.9us |