Path: blob/main/operations/observability/mixins/self-hosted/rules/observability-stack/alertmanager.yaml
3611 views
# Copyright (c) 2022 Gitpod GmbH. All rights reserved.
# Licensed under the GNU Affero General Public License (AGPL).
# See License.AGPL.txt in the project root for license information.

# PrometheusRule defining the "alertmanager" alert group. Both alerts select
# series with job="alertmanager-main" in the "monitoring-satellite" namespace.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  labels:
    app.kubernetes.io/name: kubernetes
    app.kubernetes.io/part-of: kube-prometheus
    prometheus: k8s
    role: alert-rules
  name: alertmanager-monitoring-rules
  namespace: monitoring-satellite
spec:
  groups:
    - name: alertmanager
      rules:
        # Critical: the config-reload success gauge never rose above 0 within
        # the trailing 5m window, and that condition has held for 10m.
        - alert: AlertmanagerFailedReload
          annotations:
            description: Configuration has failed to load for {{ $labels.namespace }}/{{ $labels.pod}}.
            summary: Reloading an Alertmanager configuration has failed.
          expr: |
            # Without max_over_time, failed scrapes could create false negatives, see
            # https://www.robustperception.io/alerting-on-gauges-in-prometheus-2-0 for details.
            max_over_time(alertmanager_config_last_reload_successful{job="alertmanager-main",namespace="monitoring-satellite"}[5m]) == 0
          for: 10m
          labels:
            severity: critical
            team: delivery-operations-experience
        # Warning: the ratio of the failed-notification rate to the total
        # notification rate (both over 5m) has stayed above 0.01 for 5m.
        - alert: AlertmanagerFailedToSendAlerts
          annotations:
            description: Alertmanager {{ $labels.namespace }}/{{ $labels.pod}} failed to send {{ $value | humanizePercentage }} of notifications to {{ $labels.integration }}.
            summary: An Alertmanager instance failed to send notifications.
          expr: |
            (
              rate(alertmanager_notifications_failed_total{job="alertmanager-main",namespace="monitoring-satellite"}[5m])
            /
              rate(alertmanager_notifications_total{job="alertmanager-main",namespace="monitoring-satellite"}[5m])
            )
            > 0.01
          for: 5m
          labels:
            severity: warning
            team: delivery-operations-experience