File tree Expand file tree Collapse file tree 1 file changed +15
-1
lines changed
operations/observability/mixins/workspace/rules/components/ws-daemon Expand file tree Collapse file tree 1 file changed +15
-1
lines changed Original file line number Diff line number Diff line change 12
12
{
13
13
alert: 'GitpodWsDaemonCrashLooping' ,
14
14
labels: {
15
- severity: 'critical ' ,
15
+ severity: 'warning ' ,
16
16
},
17
17
annotations: {
18
18
runbook_url: 'https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWsDaemonCrashLooping.md' ,
23
23
increase(kube_pod_container_status_restarts_total{container="ws-daemon"}[10m]) > 0
24
24
||| ,
25
25
},
26
+ {
+ // Critical alert: a ws-daemon container restarted AND regular workspace backups failed within the same 10m window.
27
+ alert: 'BackupFailureBecauseOfGitpodWsDaemonCrash' ,
28
+ labels: {
29
+ severity: 'critical' ,
30
+ },
31
+ annotations: {
32
+ runbook_url: 'https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWsDaemonCrashLooping.md' ,
33
+ summary: 'Increase the number of backup failure because of ws-daemon is crashlooping.' ,
+ // This template reads the namespace/pod/container labels and $value, so expr must keep those labels on its result.
34
+ description: 'Pod {{ $labels.namespace }}/{{ $labels.pod }} ({{ $labels.container }}) is restarting {{ printf "%.2f" $value }} times / 10 minutes.' ,
35
+ },
+ // Restarts are summed per pod (not cluster-wide) so the labels used above survive aggregation and $value is that pod's restart count.
+ // `and on()` matches on no labels, letting the label-less backup-failure total gate every per-pod restart series.
36
+ expr: |||
37
+ sum by (namespace, pod, container) (increase(kube_pod_container_status_restarts_total{container="ws-daemon"}[10m])) > 0 and on() sum(increase(gitpod_ws_manager_workspace_backups_failure_total{type="REGULAR"}[10m])) > 0
38
+ ||| ,
39
+ },
26
40
{
27
41
alert: 'GitpodWsDaemonExcessiveGC' ,
28
42
labels: {
You can’t perform that action at this time.
0 commit comments