diff --git a/roles/nagios_client/tasks/main.yml b/roles/nagios_client/tasks/main.yml index 609130cd62..ed31059ee4 100644 --- a/roles/nagios_client/tasks/main.yml +++ b/roles/nagios_client/tasks/main.yml @@ -98,6 +98,10 @@ - check_datanommer_history.cfg - check_memcache.cfg - check_lock_file_age.cfg + - check_koschei_polling_proc.cfg + - check_koschei_resolver_proc.cfg + - check_koschei_scheduler_proc.cfg + - check_koschei_watcher_proc.cfg notify: - restart nrpe tags: diff --git a/roles/nagios_client/templates/check_koschei_polling_proc.cfg.j2 b/roles/nagios_client/templates/check_koschei_polling_proc.cfg.j2 new file mode 100644 index 0000000000..d71f83a92c --- /dev/null +++ b/roles/nagios_client/templates/check_koschei_polling_proc.cfg.j2 @@ -0,0 +1 @@ +command[check_koschei_polling_proc]={{ libdir }}/nagios/plugins/check_procs -s RSD -u koschei -C koschei-polling -c 1:1 diff --git a/roles/nagios_client/templates/check_koschei_resolver_proc.cfg.j2 b/roles/nagios_client/templates/check_koschei_resolver_proc.cfg.j2 new file mode 100644 index 0000000000..026d60641a --- /dev/null +++ b/roles/nagios_client/templates/check_koschei_resolver_proc.cfg.j2 @@ -0,0 +1 @@ +command[check_koschei_resolver_proc]={{ libdir }}/nagios/plugins/check_procs -s RSD -u koschei -C koschei-resolve -c 1:1 diff --git a/roles/nagios_client/templates/check_koschei_scheduler_proc.cfg.j2 b/roles/nagios_client/templates/check_koschei_scheduler_proc.cfg.j2 new file mode 100644 index 0000000000..a1c4a02b10 --- /dev/null +++ b/roles/nagios_client/templates/check_koschei_scheduler_proc.cfg.j2 @@ -0,0 +1 @@ +command[check_koschei_scheduler_proc]={{ libdir }}/nagios/plugins/check_procs -s RSD -u koschei -C koschei-schedul -c 1:1 diff --git a/roles/nagios_client/templates/check_koschei_watcher_proc.cfg.j2 b/roles/nagios_client/templates/check_koschei_watcher_proc.cfg.j2 new file mode 100644 index 0000000000..620ab4b574 --- /dev/null +++ b/roles/nagios_client/templates/check_koschei_watcher_proc.cfg.j2 
@@ -0,0 +1 @@ +command[check_koschei_watcher_proc]={{ libdir }}/nagios/plugins/check_procs -s RSD -u koschei -C koschei-watcher -c 1:1 diff --git a/roles/nagios_server/files/nagios/services/koschei.cfg b/roles/nagios_server/files/nagios/services/koschei.cfg new file mode 100644 index 0000000000..6393a26e65 --- /dev/null +++ b/roles/nagios_server/files/nagios/services/koschei.cfg @@ -0,0 +1,27 @@ +define service { + host_name koschei01 + service_description koschei-polling process + check_command check_by_nrpe!check_koschei_polling_proc + use defaulttemplate +} + +define service { + host_name koschei01 + service_description koschei-resolver process + check_command check_by_nrpe!check_koschei_resolver_proc + use defaulttemplate +} + +define service { + host_name koschei01 + service_description koschei-scheduler process + check_command check_by_nrpe!check_koschei_scheduler_proc + use defaulttemplate +} + +define service { + host_name koschei01 + service_description koschei-watcher process + check_command check_by_nrpe!check_koschei_watcher_proc + use defaulttemplate +} diff --git a/roles/nagios_server/files/nrpe.cfg b/roles/nagios_server/files/nrpe.cfg index 82e35857d0..e85b92ff26 100644 --- a/roles/nagios_server/files/nrpe.cfg +++ b/roles/nagios_server/files/nrpe.cfg @@ -239,6 +239,10 @@ command[check_redis_proc]=/usr/lib64/nagios/plugins/check_procs -c 1:1 -C 'redis command[check_openvpn_link]=/usr/lib64/nagios/plugins/check_ping -H 192.168.1.58 -w 375.0,20% -c 500,60% command[check_memcache]=/usr/lib64/nagios/plugins/check_procs -c 1:1 -a '/usr/bin/memcached' -u memcached command[check_memcache_connect]=/usr/lib64/nagios/plugins/check_memcache_connect +command[check_koschei_polling_proc]=/usr/lib64/nagios/plugins/check_procs -s RSD -u koschei -C koschei-polling -c 1:1 +command[check_koschei_resolver_proc]=/usr/lib64/nagios/plugins/check_procs -s RSD -u koschei -C koschei-resolve -c 1:1 +command[check_koschei_scheduler_proc]=/usr/lib64/nagios/plugins/check_procs -s 
RSD -u koschei -C koschei-schedul -c 1:1 +command[check_koschei_watcher_proc]=/usr/lib64/nagios/plugins/check_procs -s RSD -u koschei -C koschei-watcher -c 1:1 # The following are fedmsg/datanommer checks to be run on busgateway01. # They check for the time since the latest message in any particular category.