@@ -11,31 +11,31 @@ groups:
11
11
team: infra
12
12
annotations:
13
13
summary: "AZ {{ $labels.zone}} is running out of memory for pods"
14
- dashboard: " https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization"
14
+ dashboard: < https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization|link>
15
15
- alert: AvailabilityZoneRunningOutOfMemory99for10m
16
16
expr: avg(node_memory_working_set_bytes/on(node)(kube_node_status_capacity{resource="memory"} - on (node) node_eviction_threshold) * on(node) group_left(zone) kube_node_labels{role="worker"}) by (zone) > 0.99
17
17
for: 10m
18
18
labels:
19
19
team: infra
20
20
annotations:
21
21
summary: "AZ {{ $labels.zone}} is running out of memory for pods"
22
- dashboard: " https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization"
22
+ dashboard: < https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization|link>
23
23
- alert: AvailabilityZoneRunningOutOfMemory95for1h
24
24
expr: avg(node_memory_working_set_bytes/on(node)(kube_node_status_capacity{resource="memory"} - on (node) node_eviction_threshold) * on(node) group_left(zone) kube_node_labels{role="worker"}) by (zone) > 0.95
25
25
for: 1h
26
26
labels:
27
27
team: infra
28
28
annotations:
29
29
summary: "AZ {{ $labels.zone}} is running out of memory for pods"
30
- dashboard: " https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization"
30
+ dashboard: < https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization|link>
31
31
- alert: AvailabilityZoneRunningOutOfMemory99for1h
32
32
expr: avg(node_memory_working_set_bytes/on(node)(kube_node_status_capacity{resource="memory"} - on (node) node_eviction_threshold) * on(node) group_left(zone) kube_node_labels{role="worker"}) by (zone) > 0.99
33
33
for: 1h
34
34
labels:
35
35
team: infra
36
36
annotations:
37
37
summary: "AZ {{ $labels.zone}} is running out of memory for pods"
38
- dashboard: " https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization"
38
+ dashboard: < https://grafana.$ENVIRONMENT.$PROVIDER.uw.systems/d/Mig_eDNVz/kubernetes-cluster-utilization|link>
39
39
- alert: NodeUnderMemoryPressure
40
40
expr: kube_node_status_condition{condition="MemoryPressure",status="true"} == 1
41
41
for: 5m
0 commit comments