Check for connectivity to memcached.
This will attempt to call the daemon's stats command which, if broken, might hang and cause nrpe to time out. We want that, as it will give us a clue as to what might be causing some other app to fail.
This commit is contained in:
parent
42e44b6e8e
commit
85c486b34b
5 changed files with 41 additions and 3 deletions
24
roles/nagios_client/files/scripts/check_memcache_connect
Normal file
24
roles/nagios_client/files/scripts/check_memcache_connect
Normal file
|
@ -0,0 +1,24 @@
|
|||
#!/bin/bash
#
# 2014-12-19
# Author: Ralph Bean <rbean@redhat.com>
#
# Nagios/NRPE check: send the "stats" command to the memcached daemon on
# 127.0.0.1:11211 using nc and report whether nc exited successfully.
#
# Exit status:
#   0 (OK)       nc exited with status 0
#   2 (CRITICAL) nc exited with a non-zero status
#   3 (UNKNOWN)  nc is not installed, so the check could not be run

# exit codes
readonly ok=0
# shellcheck disable=SC2034  # not used yet; kept so all Nagios states are named
readonly warn=1
readonly crit=2
readonly unkn=3

# Without nc the pipeline below would exit 127 and be reported as a memcached
# failure. That is a problem with this check, not with the daemon, so report
# it as UNKNOWN instead.
if ! command -v nc > /dev/null 2>&1; then
    echo "UNKNOWN: nc command not found"
    exit "$unkn"
fi

# Right now we just check to see if we can even run this command without
# hanging and timing out.  In the future, we could parse stdout for more
# fine-grained information.
# No timeout is set here: if the command hangs, this script hangs with it.
echo stats | nc 127.0.0.1 11211 > /dev/null
status=$?

if [ "$status" -ne 0 ]; then
    echo "CRIT: stats command got status code $status"
    exit "$crit"
else
    echo "OK: stats command got status code $status"
    exit "$ok"
fi
|
|
@ -31,6 +31,7 @@
|
|||
- check_fedmsg_producers_consumers.py
|
||||
- check_supybot_plugin
|
||||
- check_datanommer_timesince.py
|
||||
- check_memcache_connect
|
||||
when: not inventory_hostname.startswith('noc')
|
||||
tags:
|
||||
- nagios_client
|
||||
|
|
|
@ -1,2 +1,2 @@
|
|||
command[check_memcache]=/usr/lib64/nagios/plugins/check_procs -c 1:1 -a '/usr/bin/memcached' -u memcached
|
||||
|
||||
command[check_memcache_connect]=/usr/lib64/nagios/plugins/check_memcache_connect
|
||||
|
|
|
@ -1,12 +1,24 @@
|
|||
define service {
|
||||
host_name memcached01
|
||||
service_description Check memcached daemon
|
||||
service_description Check for the presence of the memcached daemon
|
||||
check_command check_by_nrpe!check_memcache
|
||||
use defaulttemplate
|
||||
}
|
||||
define service {
|
||||
host_name memcached02
|
||||
service_description Check memcached daemon
|
||||
service_description Check for the presence of the memcached daemon
|
||||
check_command check_by_nrpe!check_memcache
|
||||
use defaulttemplate
|
||||
}
|
||||
define service {
|
||||
host_name memcached01
|
||||
service_description Check for connectivity to the memcached daemon
|
||||
check_command check_by_nrpe!check_memcache_connect
|
||||
use defaulttemplate
|
||||
}
|
||||
define service {
|
||||
host_name memcached02
|
||||
service_description Check for connectivity to the memcached daemon
|
||||
check_command check_by_nrpe!check_memcache_connect
|
||||
use defaulttemplate
|
||||
}
|
||||
|
|
|
@ -238,6 +238,7 @@ command[check_fcomm_queue]=/usr/lib64/nagios/plugins/check_fcomm_queue
|
|||
command[check_redis_proc]=/usr/lib64/nagios/plugins/check_procs -c 1:1 -C 'redis-server' -u redis
|
||||
command[check_openvpn_link]=/usr/lib64/nagios/plugins/check_ping -H 192.168.1.58 -w 375.0,20% -c 500,60%
|
||||
command[check_memcache]=/usr/lib64/nagios/plugins/check_procs -c 1:1 -a '/usr/bin/memcached' -u memcached
|
||||
command[check_memcache_connect]=/usr/lib64/nagios/plugins/check_memcache_connect
|
||||
|
||||
# The following are fedmsg/datanommer checks to be run on busgateway01.
|
||||
# They check for the time since the latest message in any particular category.
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue