---
# PrometheusRule defining alerts for the nightly Minio bucket backups
# (stages nsodev, cusqa, cusprod) and for the Minio S3 API error count.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: backup-minio
  # Create the rule in the namespace in which the monitored app runs.
  namespace: monitoring
  labels:
    prometheus: kube-prometheus-stack-prometheus  # this name is fixed
    role: alert-rules  # also fixed
    # IMPORTANT: without this label the rule is not picked up by the
    # PrometheusOperator.
    release: kube-prometheus-stack
spec:
  groups:
    # The group name must contain ".rules".
    # NOTE(review): this group is named after nsodev but also carries the
    # cusqa and cusprod rules; the name is kept unchanged here.
    - name: "backup-minio-nsodev.rules"
      rules:
        # One rule per stage. Each fires with severity "warning" once its
        # expression has held for 1 minute.
        # NOTE(review): the expressions fire when the metric is > 0, while
        # the alert messages say the backup failed. Confirm that a non-zero
        # value of nightly_backup_successful_* really signals a failure
        # (e.g. an exit code) and not a success flag.
        - alert: backup_minio_nsodev_successful
          # The actual alert expression goes here.
          expr: 'nightly_backup_successful_nsodev{stage="nsodev"} > 0'
          for: 1m
          labels:
            severity: warning
          annotations:
            message: Nightly Backup of Minio NSODEV Bucket failed

        - alert: backup_minio_cusqa_successful
          # The actual alert expression goes here.
          expr: 'nightly_backup_successful_cusqa{stage="cusqa"} > 0'
          for: 1m
          labels:
            severity: warning
          annotations:
            message: Nightly Backup of Minio CUSQA Bucket failed

        - alert: backup_minio_cusprod_successful
          # The actual alert expression goes here.
          expr: 'nightly_backup_successful_cusprod{stage="cusprod"} > 0'
          for: 1m
          labels:
            severity: warning
          annotations:
            message: Nightly Backup of Minio CUSPROD Bucket failed

    # The group name must contain ".rules".
    - name: "minio-api.rules"
      rules:
        # Fires with severity "critical" when, per (server, api) pair, the
        # increase of minio_s3_requests_errors_total over the last 60
        # minutes exceeds 50 and that has held for 5 minutes.
        - alert: api_errors
          expr: 'sum by (server,api) (increase(minio_s3_requests_errors_total{job="minio"}[60m])) > 50'
          for: 5m
          labels:
            severity: critical
          annotations:
            message: S3(minio) API error above threshold of 50. Plz check.