From 45eb3c0f7fdf59f7f911810cfa3eae2558a4df1d Mon Sep 17 00:00:00 2001 From: friedrich goerz Date: Wed, 14 Dec 2022 08:19:47 +0100 Subject: [PATCH] NOTICKET: abolishing nightly false positive alerts --- .../prometheus/config/prometheus/alert.rules.j2 | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/templates/prometheus/config/prometheus/alert.rules.j2 b/templates/prometheus/config/prometheus/alert.rules.j2 index 9d8f57b..1f57d5b 100644 --- a/templates/prometheus/config/prometheus/alert.rules.j2 +++ b/templates/prometheus/config/prometheus/alert.rules.j2 @@ -335,19 +335,19 @@ groups: - alert: offsite backup pending expr: | - (time() - offsite_backup_archive_started_seconds) > 27 * 3600 or - (time() - offsite_backup_archive_ended_seconds) > 27 * 3600 or - (time() - offsite_backup_transfer_started_seconds) > 27 * 3600 or - (time() - offsite_backup_transfer_ended_seconds) > 27 * 3600 or - (time() - offsite_backup_forget_started_seconds) > 27 * 3600 or - (time() - offsite_backup_forget_ended_seconds) > 27 * 3600 + (time() - offsite_backup_archive_started_seconds) > 30 * 3600 or + (time() - offsite_backup_archive_ended_seconds) > 30 * 3600 or + (time() - offsite_backup_transfer_started_seconds) > 30 * 3600 or + (time() - offsite_backup_transfer_ended_seconds) > 30 * 3600 or + (time() - offsite_backup_forget_started_seconds) > 30 * 3600 or + (time() - offsite_backup_forget_ended_seconds) > 30 * 3600 for: 1m labels: severity: critical annotations: identifier: '{{ '{{' }} $labels.instance {{ '}}' }}' - summary: "one or more offsite backup metric timestamps for Instance <{{ '{{' }} $labels.instance {{ '}}' }}> older then 27h" - description: "offsite backups older then 27h." + summary: "one or more offsite backup metric timestamps for Instance <{{ '{{' }} $labels.instance {{ '}}' }}> older than 30h" + description: "offsite backups older than 30h." - alert: offsite backup metrics unavailable expr: |