Path: blob/main/operations/observability/mixins/meta/rules/meta-nodes.yaml
2500 views
# Copyright (c) 2022 Gitpod GmbH. All rights reserved.
# Licensed under the GNU Affero General Public License (AGPL).
# See License.AGPL.txt in the project root for license information.

# Alerting rules for nodes whose `instance` label contains "meta".
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    prometheus: k8s
    role: alert-rules
  name: meta-nodes-monitoring-rules
spec:
  groups:
  - name: meta-nodes
    rules:
    # Fires when the kernel OOM-kill counter of a matching node grew by more
    # than 1 within the trailing 10-minute window. There is no `for:` clause,
    # so the alert fires on the first evaluation where the condition holds.
    - alert: GitpodMetaNodeOOMKills
      labels:
        severity: warning
      annotations:
        runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodMetaNodeOOMKills.md
        summary: A meta node is reporting OOM kills.
        description: Meta node {{ $labels.instance }} is reporting {{ printf "%.2f" $value }} Out Of Memory kills in the last 10 minutes.
      expr: increase(node_vmstat_oom_kill{instance=~".*meta.*"}[10m]) > 1
    # Fires when the non-idle CPU share of a matching node, averaged over all
    # of its CPUs, stays above 75% for 10 minutes.
    - alert: GitpodMetaNodeCPUSaturation
      labels:
        severity: warning
      for: 10m
      annotations:
        runbook_url: https://github.com/gitpod-io/runbooks/blob/main/runbooks/GitpodMetaNodeCPUSaturation.md
        summary: High CPU Saturation of a meta node.
        description: Meta node {{ $labels.instance }} is reporting {{ printf "%.2f" $value }}% CPU usage for more than 10 minutes.
      # rate() rather than irate(): irate() only looks at the last two samples,
      # so a single brief dip would reset the `for: 10m` timer.
      expr: (1 - (avg by (instance) (rate(node_cpu_seconds_total{mode="idle", instance=~".*meta.*"}[2m])))) * 100 > 75