feat: zfs prom rules

This commit is contained in:
auricom
2024-10-20 18:19:36 +02:00
parent de651faa82
commit e67c466866
3 changed files with 48 additions and 0 deletions

View File

@@ -0,0 +1,7 @@
---
# yaml-language-server: $schema=https://raw.githubusercontent.com/SchemaStore/schemastore/master/src/schemas/json/kustomization.json
# Kustomize entry point for this directory.
kind: Kustomization
apiVersion: kustomize.config.k8s.io/v1beta1
# Manifests pulled in by this kustomization.
resources:
  - ./zfs.yaml
# Namespace applied by kustomize to the resources listed above.
namespace: monitoring

View File

@@ -0,0 +1,18 @@
---
# PrometheusRule (Prometheus Operator CRD) defining one alert on the
# zrepl_replication_filesystem_errors metric.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: zrepl-replication-errors
  namespace: monitoring
spec:
  groups:
    - name: zrepl.rules
      rules:
        - alert: ZreplReplicationFilesystemErrors
          # `!= 0` instead of `> 0` so negative values also fire.
          # NOTE(review): zrepl's metric help text states the gauge is -1 when
          # a job fails before enumerating filesystems - confirm against the
          # deployed zrepl version. For non-negative values this is identical
          # to the previous `> 0` condition.
          expr: zrepl_replication_filesystem_errors != 0
          # Fire only if the condition persists for 15 minutes.
          for: 15m
          labels:
            severity: warning
          annotations:
            summary: "Zrepl replication filesystem errors detected"
            description: "Zrepl job {{ $labels.zrepl_job }} has encountered filesystem errors during replication."