diff --git a/otc/observability.t09.de/stacks/observability/victoria-k8s-stack/manifests/alerts.yaml b/otc/observability.t09.de/stacks/observability/victoria-k8s-stack/manifests/alerts.yaml
index 3d2ce3f..f884bd9 100644
--- a/otc/observability.t09.de/stacks/observability/victoria-k8s-stack/manifests/alerts.yaml
+++ b/otc/observability.t09.de/stacks/observability/victoria-k8s-stack/manifests/alerts.yaml
@@ -1,18 +1,23 @@
 apiVersion: operator.victoriametrics.com/v1beta1
 kind: VMRule
 metadata:
-  name: alerting-example
+  name: forgejo-alerts
   namespace: observability
 spec:
   groups:
-    - name: vmalert
+    - name: forgejo
       rules:
-        - alert: vmalert config reload error
-          expr: delta(vmalert_config_last_reload_errors_total[5m]) > 0
-          for: 10s
+        # Fires when the summed `up` value of the forgejo-server pods in a
+        # cluster environment stays below 1 for 30s.
+        # NOTE(review): the expression returns no sample, and so cannot fire,
+        # when no matching `up` series exists at all - confirm this is acceptable.
+        - alert: forgejo down
+          expr: sum by(cluster_environment) (up{pod=~"forgejo-server-.*"}) < 1
+          for: 30s
           labels:
             severity: major
-            job: "{{ $labels.job }}"
+            # No `job` label here: `sum by(cluster_environment)` drops every
+            # other label, so a templated `$labels.job` always rendered empty.
           annotations:
             value: "{{ $value }}"
-            description: 'error reloading vmalert config, reload count for 5 min {{ $value }}'
\ No newline at end of file
+            description: 'forgejo is down in cluster environment {{ $labels.cluster_environment }}'