mirror of https://github.com/zulip/zulip.git
[manual] puppet: Consolidate check_rabbitmq_*_consumers commands
This temporarily breaks the rabbitmq consumer checks for user_activity and notify_tornado on prod. This should be deployed in such a way as to minimize the time that the alert needs to be ignored. (imported from commit 08fa2f0e7d78fca1346c62824573263e42339a45)
This commit is contained in:
parent
6e54ca3045
commit
61ca14b400
|
@ -127,23 +127,8 @@ define command{
|
||||||
}
|
}
|
||||||
|
|
||||||
define command{
|
define command{
|
||||||
command_name check_rabbitmq_tornado_consumers
|
command_name check_rabbitmq_consumers
|
||||||
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers tornado'
|
command_line /usr/lib/nagios/plugins/check_by_ssh -p 22 -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers $ARG1$'
|
||||||
}
|
|
||||||
|
|
||||||
define command{
|
|
||||||
command_name check_rabbitmq_useractivity_consumers
|
|
||||||
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers useractivity'
|
|
||||||
}
|
|
||||||
|
|
||||||
define command{
|
|
||||||
command_name check_rabbitmq_signups_consumers
|
|
||||||
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers signups'
|
|
||||||
}
|
|
||||||
|
|
||||||
define command{
|
|
||||||
command_name check_rabbitmq_invites_consumers
|
|
||||||
command_line /usr/lib/nagios/plugins/check_by_ssh -p $ARG1$ -l humbug -t 30 -i /var/lib/nagios/.ssh/id_rsa -H $HOSTADDRESS$ -C '/usr/lib/nagios/plugins/check_rabbitmq_consumers invites'
|
|
||||||
}
|
}
|
||||||
|
|
||||||
define command{
|
define command{
|
||||||
|
|
|
@ -266,7 +266,7 @@ define service {
|
||||||
define service {
|
define service {
|
||||||
use generic-service
|
use generic-service
|
||||||
service_description Check rabbitmq notify_tornado consumers
|
service_description Check rabbitmq notify_tornado consumers
|
||||||
check_command check_rabbitmq_tornado_consumers!22
|
check_command check_rabbitmq_consumers!notify_tornado
|
||||||
# Workaround weird checks 40s after first error causing alerts
|
# Workaround weird checks 40s after first error causing alerts
|
||||||
# from a single failure because cron hasn't run again yet
|
# from a single failure because cron hasn't run again yet
|
||||||
max_check_attempts 3
|
max_check_attempts 3
|
||||||
|
@ -276,8 +276,8 @@ define service {
|
||||||
|
|
||||||
define service {
|
define service {
|
||||||
use generic-service
|
use generic-service
|
||||||
service_description Check rabbitmq useractivity consumers
|
service_description Check rabbitmq user_activity consumers
|
||||||
check_command check_rabbitmq_useractivity_consumers!22
|
check_command check_rabbitmq_consumers!user_activity
|
||||||
# Workaround weird checks 40s after first error causing alerts
|
# Workaround weird checks 40s after first error causing alerts
|
||||||
# from a single failure because cron hasn't run again yet
|
# from a single failure because cron hasn't run again yet
|
||||||
max_check_attempts 3
|
max_check_attempts 3
|
||||||
|
@ -288,7 +288,7 @@ define service {
|
||||||
define service {
|
define service {
|
||||||
use generic-service
|
use generic-service
|
||||||
service_description Check rabbitmq invites consumers
|
service_description Check rabbitmq invites consumers
|
||||||
check_command check_rabbitmq_invites_consumers!22
|
check_command check_rabbitmq_consumers!invites
|
||||||
# Workaround weird checks 40s after first error causing alerts
|
# Workaround weird checks 40s after first error causing alerts
|
||||||
# from a single failure because cron hasn't run again yet
|
# from a single failure because cron hasn't run again yet
|
||||||
max_check_attempts 3
|
max_check_attempts 3
|
||||||
|
@ -299,7 +299,7 @@ define service {
|
||||||
define service {
|
define service {
|
||||||
use generic-service
|
use generic-service
|
||||||
service_description Check rabbitmq signups consumers
|
service_description Check rabbitmq signups consumers
|
||||||
check_command check_rabbitmq_signups_consumers!22
|
check_command check_rabbitmq_consumers!signups
|
||||||
# Workaround weird checks 40s after first error causing alerts
|
# Workaround weird checks 40s after first error causing alerts
|
||||||
# from a single failure because cron hasn't run again yet
|
# from a single failure because cron hasn't run again yet
|
||||||
max_check_attempts 3
|
max_check_attempts 3
|
||||||
|
|
Loading…
Reference in New Issue