@@ -1425,15 +1425,15 @@ tests:
1425
1425
summary : " StatefulSet has not matched the expected number of replicas."
1426
1426
1427
1427
- name : KubeCPUOvercommit alert (single-node)
1428
- - interval : 1m
1428
+ interval : 1m
1429
1429
input_series :
1430
1430
- series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1431
1431
values : ' 1x10'
1432
1432
- series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1433
1433
values : ' 1x10'
1434
1434
- series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="cpu", job="kube-state-metrics"}'
1435
1435
values : ' 1.9x10' # This value was seen on a 2x vCPU node
1436
- - series : ' kube_node_info{ cluster="kubernetes", node="n1", job="kube-state-metrics "}'
1436
+ - series : ' kube_node_role{ cluster="kubernetes", node="n1", role="control-plane "}'
1437
1437
values : ' 1x10'
1438
1438
alert_rule_test :
1439
1439
- eval_time : 9m
@@ -1444,12 +1444,12 @@ tests:
1444
1444
- exp_labels :
1445
1445
severity : warning
1446
1446
exp_annotations :
1447
- description : Cluster has overcommitted CPU resource requests for Pods by 0.385 CPU shares and cannot tolerate node failure.
1447
+ description : Cluster has overcommitted CPU resource requests for Pods by 0.10000000000000009 CPU shares and cannot tolerate node failure.
1448
1448
runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit
1449
1449
summary : Cluster has overcommitted CPU resource requests.
1450
1450
1451
1451
- name : KubeCPUOvercommit alert (multi-node)
1452
- - interval : 1m
1452
+ interval : 1m
1453
1453
input_series :
1454
1454
- series : ' namespace_cpu:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1455
1455
values : ' 2x10'
@@ -1459,9 +1459,9 @@ tests:
1459
1459
values : ' 1.9x10' # This value was seen on a 2x vCPU node
1460
1460
- series : ' kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="cpu", job="kube-state-metrics"}'
1461
1461
values : ' 1.9x10'
1462
- - series : ' kube_node_info{ cluster="kubernetes", node="n1", job="kube-state-metrics "}'
1462
+ - series : ' kube_node_role{ cluster="kubernetes", node="n1", role="control-plane "}'
1463
1463
values : ' 1x10'
1464
- - series : ' kube_node_info{ cluster="kubernetes", node="n2", job="kube-state-metrics "}'
1464
+ - series : ' kube_node_role{ cluster="kubernetes", node="n2", role="control-plane "}'
1465
1465
values : ' 1x10'
1466
1466
alert_rule_test :
1467
1467
- eval_time : 9m
@@ -1472,20 +1472,20 @@ tests:
1472
1472
- exp_labels :
1473
1473
severity : warning
1474
1474
exp_annotations :
1475
- description : Cluster has overcommitted CPU resource requests for Pods by 2.1 CPU shares and cannot tolerate node failure.
1475
+ description : Cluster has overcommitted CPU resource requests for Pods by 0.20000000000000018 CPU shares and cannot tolerate node failure.
1476
1476
runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecpuovercommit
1477
1477
summary : Cluster has overcommitted CPU resource requests.
1478
1478
1479
1479
- name : KubeMemoryOvercommit alert (single-node)
1480
- - interval : 1m
1480
+ interval : 1m
1481
1481
input_series :
1482
1482
- series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1483
1483
values : ' 1000000000x10' # 1 GB
1484
1484
- series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="kube-system"}'
1485
1485
values : ' 1000000000x10'
1486
1486
- series : ' kube_node_status_allocatable{cluster="kubernetes", node="n1", resource="memory", job="kube-state-metrics"}'
1487
1487
values : ' 1000000000x10'
1488
- - series : ' kube_node_info {cluster="kubernetes", node="n1", job="kube-state-metrics "}'
1488
+ - series : ' kube_node_role {cluster="kubernetes", node="n1", role="control-plane "}'
1489
1489
values : ' 1x10'
1490
1490
alert_rule_test :
1491
1491
- eval_time : 9m
@@ -1496,12 +1496,12 @@ tests:
1496
1496
- exp_labels :
1497
1497
severity : warning
1498
1498
exp_annotations :
1499
- description : Cluster has overcommitted memory resource requests for Pods by 1.15G bytes and cannot tolerate node failure.
1499
+ description : Cluster has overcommitted memory resource requests for Pods by 1G bytes and cannot tolerate node failure.
1500
1500
runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit
1501
1501
summary : Cluster has overcommitted memory resource requests.
1502
1502
1503
1503
- name : KubeMemoryOvercommit alert (multi-node)
1504
- - interval : 1m
1504
+ interval : 1m
1505
1505
input_series :
1506
1506
- series : ' namespace_memory:kube_pod_container_resource_requests:sum{cluster="kubernetes", namespace="default"}'
1507
1507
values : ' 2000000000x10' # 2 GB
@@ -1511,9 +1511,9 @@ tests:
1511
1511
values : ' 1000000000x10'
1512
1512
- series : ' kube_node_status_allocatable{cluster="kubernetes", node="n2", resource="memory", job="kube-state-metrics"}'
1513
1513
values : ' 1000000000x10'
1514
- - series : ' kube_node_info {cluster="kubernetes", node="n1", job="kube-state-metrics "}'
1514
+ - series : ' kube_node_role {cluster="kubernetes", node="n1", role="control-plane "}'
1515
1515
values : ' 1x10'
1516
- - series : ' kube_node_info {cluster="kubernetes", node="n2", job="kube-state-metrics "}'
1516
+ - series : ' kube_node_role {cluster="kubernetes", node="n2", role="control-plane "}'
1517
1517
values : ' 1x10'
1518
1518
alert_rule_test :
1519
1519
- eval_time : 9m
@@ -1524,6 +1524,6 @@ tests:
1524
1524
- exp_labels :
1525
1525
severity : warning
1526
1526
exp_annotations :
1527
- description : Cluster has overcommitted memory resource requests for Pods by 3G bytes and cannot tolerate node failure.
1527
+ description : Cluster has overcommitted memory resource requests for Pods by 2G bytes and cannot tolerate node failure.
1528
1528
runbook_url : https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubememoryovercommit
1529
1529
summary : Cluster has overcommitted memory resource requests.
0 commit comments