Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
gitpod-io
GitHub Repository: gitpod-io/gitpod
Path: blob/main/operations/observability/mixins/workspace/rules/satellite/ws-daemon.yaml
2506 views
1
# Copyright (c) 2022 Gitpod GmbH. All rights reserved.
2
# Licensed under the GNU Affero General Public License (AGPL).
3
# See License.AGPL.txt in the project root for license information.
4
5
---
# PrometheusRule defining the alerting rules of the "ws-daemon" group.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    prometheus: k8s
    role: alert-rules
  name: ws-daemon-monitoring-satellite-rules
spec:
  groups:
    - name: ws-daemon
      rules:
        # Fires when, over the same 10-minute window and for the same
        # `cluster` label, both of the following increased:
        #   1. the restart counter of containers named "ws-daemon", and
        #   2. the counter of workspace backup failures of type "Regular".
        # No `for:` duration is set on this rule.
        - alert: BackupFailureBecauseOfGitpodWsDaemonCrash
          labels:
            severity: critical
          annotations:
            runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWsDaemonCrashLooping.md
            summary: Increase the number of backup failure because of ws-daemon is crashlooping.
            # `$value` is the value of the left-hand operand of `AND`,
            # i.e. the summed increase in ws-daemon restarts.
            description: 'Ws-daemon is restarting {{ printf "%.2f" $value }} times / 10 minutes.'
            dashboard_url: https://grafana.gitpod.io/d/ws-daemon/gitpod-component-ws-daemon
          # Literal block scalar; the line breaks are only for readability
          # and are not significant to PromQL.
          expr: |
            sum(increase(kube_pod_container_status_restarts_total{container="ws-daemon"}[10m])) by(cluster) > 0
            AND
            sum(increase(gitpod_ws_manager_mk2_workspace_backups_failure_total{type="Regular"}[10m])) by(cluster) > 0
26
27