File tree Expand file tree Collapse file tree 3 files changed +18
-1
lines changed Expand file tree Collapse file tree 3 files changed +18
-1
lines changed Load Diff This file was deleted.
Original file line number Diff line number Diff line change @@ -2044,6 +2044,15 @@ groups:
2044
2044
query : ' kube_node_status_condition{condition="Ready",status="true"} == 0'
2045
2045
severity : critical
2046
2046
for : 10m
2047
+ - name : Kubernetes Node scheduling disabled
2048
+ summary : Kubernetes node scheduling disabled (node {{ $labels.node }})
2049
+ description : Node {{ $labels.node }} has been marked as unschedulable for more than 30 minutes.
2050
+ query : ' kube_node_spec_taint{key="node.kubernetes.io/unschedulable"} == 1'
2051
+ severity : warning
2052
+ for : 30m
2053
+ comments : |
2054
+ Kubernetes nodes with scheduling disabled are fine in themselves.
2055
+ This alert is useful for getting warned when nodes remain unschedulable for longer than expected.
2047
2056
- name : Kubernetes Node memory pressure
2048
2057
summary : Kubernetes memory pressure (node {{ $labels.node }})
2049
2058
description : " Node {{ $labels.node }} has MemoryPressure condition"
Original file line number Diff line number Diff line change @@ -13,6 +13,15 @@ groups:
13
13
summary : Kubernetes Node ready (node {{ $labels.node }})
14
14
description : " Node {{ $labels.node }} has been unready for a long time\n VALUE = {{ $value }}\n LABELS = {{ $labels }}"
15
15
16
+ - alert : KubernetesNodeSchedulingDisabled
17
+ expr : ' kube_node_spec_taint{key="node.kubernetes.io/unschedulable"} == 1'
18
+ for : 30m
19
+ labels :
20
+ severity : warning
21
+ annotations :
22
+ summary : Kubernetes node scheduling disabled (node {{ $labels.node }})
23
+ description : " Node {{ $labels.node }} has been marked as unschedulable for more than 30 minutes.\n VALUE = {{ $value }}\n LABELS = {{ $labels }}"
24
+
16
25
- alert : KubernetesNodeMemoryPressure
17
26
expr : ' kube_node_status_condition{condition="MemoryPressure",status="true"} == 1'
18
27
for : 2m
You can’t perform that action at this time.
0 commit comments