From 953f2e5c4a2279e2f98a4e3fbcded409c1fe0053 Mon Sep 17 00:00:00 2001 From: Francois Andrieu Date: Feb 05 2023 22:52:10 +0000 Subject: ocp_monitoring: fix cronjob alert rule --- diff --git a/roles/openshift/project/templates/prometheusRules.yml b/roles/openshift/project/templates/prometheusRules.yml index dd14e2f..0d36427 100644 --- a/roles/openshift/project/templates/prometheusRules.yml +++ b/roles/openshift/project/templates/prometheusRules.yml @@ -13,7 +13,7 @@ spec: annotations: description: Latest execution of CronJob {{$labels.namespace}}/{{$labels.cronjob}} failed to complete. summary: Latest job {{$labels.cronjob}} has failed. - expr: kube_cronjob_status_last_schedule_time - kube_cronjob_status_last_successful_time > 0 + expr: (kube_cronjob_status_last_schedule_time - kube_cronjob_status_last_successful_time) * (1 - kube_cronjob_status_active) > 0 for: 5m labels: severity: warning