[manual] puppet: Consolidate check_rabbitmq_*_consumers commands

This temporarily breaks the rabbitmq consumer checks for
user_activity and notify_tornado on prod.  This should be deployed in
such a way as to minimize the time that the alert needs to be ignored.

(imported from commit 08fa2f0e7d78fca1346c62824573263e42339a45)
This commit is contained in:
Zev Benjamin 2013-09-23 14:58:02 -04:00
parent 6e54ca3045
commit 61ca14b400
2 changed files with 7 additions and 22 deletions

View File

@ -127,23 +127,8 @@ define command{
} }
define command{ define command{
command_name check_rabbitmq_tornado_consumers command_name check_rabbitmq_consumers
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers tornado' command_line /usr/lib/nagios/plugins/check_by_ssh -p 22 -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers $ARG1$'
}
define command{
command_name check_rabbitmq_useractivity_consumers
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers useractivity'
}
define command{
command_name check_rabbitmq_signups_consumers
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers signups'
}
define command{
command_name check_rabbitmq_invites_consumers
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers invites'
} }
define command{ define command{

View File

@ -266,7 +266,7 @@ define service {
define service { define service {
use generic-service use generic-service
service_description Check rabbitmq notify_tornado consumers service_description Check rabbitmq notify_tornado consumers
check_command check_rabbitmq_tornado_consumers!22 check_command check_rabbitmq_consumers!notify_tornado
# Workaround weird checks 40s after first error causing alerts # Workaround weird checks 40s after first error causing alerts
# from a single failure because cron hasn't run again yet # from a single failure because cron hasn't run again yet
max_check_attempts 3 max_check_attempts 3
@ -276,8 +276,8 @@ define service {
define service { define service {
use generic-service use generic-service
service_description Check rabbitmq useractivity consumers service_description Check rabbitmq user_activity consumers
check_command check_rabbitmq_useractivity_consumers!22 check_command check_rabbitmq_consumers!user_activity
# Workaround weird checks 40s after first error causing alerts # Workaround weird checks 40s after first error causing alerts
# from a single failure because cron hasn't run again yet # from a single failure because cron hasn't run again yet
max_check_attempts 3 max_check_attempts 3
@ -288,7 +288,7 @@ define service {
define service { define service {
use generic-service use generic-service
service_description Check rabbitmq invites consumers service_description Check rabbitmq invites consumers
check_command check_rabbitmq_invites_consumers!22 check_command check_rabbitmq_consumers!invites
# Workaround weird checks 40s after first error causing alerts # Workaround weird checks 40s after first error causing alerts
# from a single failure because cron hasn't run again yet # from a single failure because cron hasn't run again yet
max_check_attempts 3 max_check_attempts 3
@ -299,7 +299,7 @@ define service {
define service { define service {
use generic-service use generic-service
service_description Check rabbitmq signups consumers service_description Check rabbitmq signups consumers
check_command check_rabbitmq_signups_consumers!22 check_command check_rabbitmq_consumers!signups
# Workaround weird checks 40s after first error causing alerts # Workaround weird checks 40s after first error causing alerts
# from a single failure because cron hasn't run again yet # from a single failure because cron hasn't run again yet
max_check_attempts 3 max_check_attempts 3