Path: blob/main/operations/observability/mixins/workspace/rules/satellite/ws-daemon.yaml
2506 views
# Copyright (c) 2022 Gitpod GmbH. All rights reserved.
# Licensed under the GNU Affero General Public License (AGPL).
# See License.AGPL.txt in the project root for license information.

# PrometheusRule that defines the alerting rules of the "ws-daemon" group.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    prometheus: k8s
    role: alert-rules
  name: ws-daemon-monitoring-satellite-rules
spec:
  groups:
    - name: ws-daemon
      rules:
        # Fires for a cluster when, over the last 10 minutes, BOTH hold:
        #   1. the restart counter of the "ws-daemon" container increased, and
        #   2. the counter of failed "Regular" workspace backups increased.
        # No `for:` clause is set, so there is no pending period.
        - alert: BackupFailureBecauseOfGitpodWsDaemonCrash
          labels:
            severity: critical
          annotations:
            runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodWsDaemonCrashLooping.md
            summary: Increase the number of backup failure because of ws-daemon is crashlooping.
            # $value is the left-hand operand of the AND below, i.e. the
            # ws-daemon restart increase over the 10-minute window.
            description: Ws-daemon is restarting {{ printf "%.2f" $value }} times / 10 minutes.
            dashboard_url: https://grafana.gitpod.io/d/ws-daemon/gitpod-component-ws-daemon
          # Both sides are aggregated by(cluster), so the AND matches restart
          # and backup-failure series on the `cluster` label.
          expr: |
            sum(increase(kube_pod_container_status_restarts_total{container="ws-daemon"}[10m])) by(cluster) > 0 AND sum(increase(gitpod_ws_manager_mk2_workspace_backups_failure_total{type="Regular"}[10m])) by(cluster) > 0