From f89b1fdba93b473b2cd89899db24248a22a99dc1 Mon Sep 17 00:00:00 2001 From: Pierre-Yves Chibon Date: Mar 20 2020 13:36:31 +0000 Subject: nagios: change the string checked on the status page Nagios is supposed to warn us if status.fp.o isn't running; that is the goal of this check. However, Nagios was checking for the presence of the string "All systems go". This is fine until one system goes down: Nagios tells us about that system, we go look at it, and we (manually) update status.fp.o so our users know that we know about the outage. Then Nagios alerts that status.fp.o isn't how it should be, and we have to tell Nagios that we already know, since we updated the status page ourselves. So instead of checking for "All systems go", we now check for "Fedora Infrastructure Status", which is at the top of the page and will remain there as long as status.fp.o is up, regardless of the state of the rest of the infra. Signed-off-by: Pierre-Yves Chibon --- diff --git a/roles/nagios_server/templates/nagios/services/websites.cfg.j2 b/roles/nagios_server/templates/nagios/services/websites.cfg.j2 index c8958d7..61fe6ef 100644 --- a/roles/nagios_server/templates/nagios/services/websites.cfg.j2 +++ b/roles/nagios_server/templates/nagios/services/websites.cfg.j2 @@ -135,7 +135,7 @@ define service { define service { host_name status service_description http-status.fedoraproject.org - check_command check_website_ssl!www.fedorastatus.org!/index.html!All systems go + check_command check_website_ssl!www.fedorastatus.org!/index.html!Fedora Infrastructure Status use websitetemplate }