2013-01-24 17:43:47 +01:00
|
|
|
# HTTP check applied to the "web" hostgroup.
# Inherits defaults from the generic-service template; notifies page_admins.
define service {
    use                     generic-service
    service_description     HTTP
    hostgroup_name          web
    check_command           check_http
    contact_groups          page_admins
}
|
2012-11-01 15:47:50 +01:00
|
|
|
|
|
|
|
# SSH check applied to the "all" hostgroup.
# Inherits defaults from the generic-service template; notifies page_admins.
define service {
    use                     generic-service
    service_description     SSH
    hostgroup_name          all
    check_command           check_ssh
    contact_groups          page_admins
}
|
2012-11-16 16:42:52 +01:00
|
|
|
|
|
|
|
# Remote disk check applied to the "all" hostgroup; notifies page_admins.
# NOTE(review): the arguments (22, 20%, 10%, /) look like port, warning
# threshold, critical threshold and path -- confirm against the
# check_remote_disk command definition.
define service {
    use                     generic-service
    service_description     remote disk
    hostgroup_name          all
    check_command           check_remote_disk!22!20%!10%!/
    contact_groups          page_admins
}
|
|
|
|
|
|
|
|
# Remote load check applied to the "all" hostgroup; notifies page_admins.
# NOTE(review): the two comma-separated triples look like warning and
# critical load-average thresholds -- confirm against the
# check_remote_load command definition.
define service {
    use                     generic-service
    service_description     remote load
    hostgroup_name          all
    check_command           check_remote_load!22!5.0,4.0,3.0!10.0,6.0,4.0
    contact_groups          page_admins
}
|
2012-11-16 17:19:53 +01:00
|
|
|
|
|
|
|
# Zephyr mirror forwarding check on host zmirror; notifies page_admins.
define service {
    use                     generic-service
    service_description     zephyr mirror forwarding
    host                    zmirror
    check_command           check_zephyr_mirror_forwarding!22
    # The real check is executed from cron, so retry_check_interval must
    # always be kept equal to normal_check_interval.
    normal_check_interval   2
    retry_check_interval    2
    max_check_attempts      2
    contact_groups          page_admins
}
|
2012-11-16 17:20:12 +01:00
|
|
|
|
|
|
|
# User zephyr mirror liveness check on host app; notifies admins.
define service {
    use                     generic-service
    service_description     user zephyr mirror liveness
    host                    app
    check_command           check_user_zephyr_mirror_liveness!22
    contact_groups          admins
}
|
2012-11-21 20:17:15 +01:00
|
|
|
|
|
|
|
# Debian package update check applied to the "all" hostgroup; notifies admins.
define service {
    use                     generic-service
    service_description     Debian update availability
    hostgroup_name          all
    check_command           check_debian_packages!22
    contact_groups          admins
}
|
2013-01-02 23:49:05 +01:00
|
|
|
|
|
|
|
# NTP time check applied to the "all" hostgroup; notifies admins.
define service {
    use                     generic-service
    service_description     Check NTP time
    hostgroup_name          all
    check_command           check_ntp_time!22
    contact_groups          admins
}
|
2013-01-03 16:56:36 +01:00
|
|
|
|
|
|
|
# Feedback bot check on host bots.
define service {
    use                     generic-service
    service_description     Check feedback bot
    host                    bots
    check_command           check_feedback_bot!22
    # When the bot is down, feedback is not lost; it simply is not
    # reported through Humbug. That is why this does not page.
    contact_groups          admins
}
|
2013-01-30 16:12:15 +01:00
|
|
|
|
|
|
|
# Send/receive time check on host staging; notifies admins.
define service {
    use                     generic-service
    service_description     Check send receive time
    host                    staging
    check_command           check_send_receive_time!22
    contact_groups          admins
}
|
2013-01-30 16:14:38 +01:00
|
|
|
|
|
|
|
## check_postgres.pl services
|
|
|
|
|
|
|
|
# check_postgres "autovac_freeze" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres autovac_freeze
    host                    postgres
    check_command           check_postgres!22!autovac_freeze
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "backends" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres backends
    host                    postgres
    check_command           check_postgres!22!backends
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "connection" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres connection
    host                    postgres
    check_command           check_postgres!22!connection
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "hitratio" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres hitratio
    host                    postgres
    check_command           check_postgres!22!hitratio
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "locks" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres locks
    host                    postgres
    check_command           check_postgres!22!locks
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "query_time" action on host postgres; notifies admins.
# NOTE(review): "20 seconds" / "40 seconds" look like warning and critical
# thresholds -- confirm against the check_postgres_alert_args definition.
define service {
    use                     generic-service
    service_description     Check postgres query_time
    host                    postgres
    check_command           check_postgres_alert_args!22!query_time!20 seconds!40 seconds
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "sequence" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres sequence
    host                    postgres
    check_command           check_postgres!22!sequence
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "timesync" action on host postgres; notifies admins.
define service {
    use                     generic-service
    service_description     Check postgres timesync
    host                    postgres
    check_command           check_postgres!22!timesync
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "txn_idle" action on host postgres; notifies admins.
# NOTE(review): "20 seconds" / "40 seconds" look like warning and critical
# thresholds -- confirm against the check_postgres_alert_args definition.
define service {
    use                     generic-service
    service_description     Check postgres txn_idle
    host                    postgres
    check_command           check_postgres_alert_args!22!txn_idle!20 seconds!40 seconds
    contact_groups          admins
}
|
|
|
|
|
|
|
|
# check_postgres "txn_time" action on host postgres; notifies admins.
# NOTE(review): "20 seconds" / "40 seconds" look like warning and critical
# thresholds -- confirm against the check_postgres_alert_args definition.
define service {
    use                     generic-service
    service_description     Check postgres txn_time
    host                    postgres
    check_command           check_postgres_alert_args!22!txn_time!20 seconds!40 seconds
    contact_groups          admins
}
|
2013-01-30 15:59:41 +01:00
|
|
|
|
|
|
|
# process_user_activity bot check applied to the "frontends" hostgroup.
define service {
    use                     generic-service
    service_description     process_user_activity bot
    hostgroup_name          frontends
    check_command           check_process_user_activity!22
    # Activity is not lost while this is not running, but it is critical
    # that it arrives: otherwise MIT folks are falsely told that their
    # mirrors are down.
    # This service is also responsible for active/idle status.
    contact_groups          page_admins
}
|
2013-02-05 19:17:49 +01:00
|
|
|
|
2013-04-05 23:15:08 +02:00
|
|
|
# Humbug-to-MailChimp signup sync check applied to the "frontends"
# hostgroup; notifies admins.
define service {
    use                     generic-service
    service_description     sync signups from humbug to mailchimp
    hostgroup_name          frontends
    check_command           check_process_mailchimp_signups!22
    contact_groups          admins
}
|
|
|
|
|
2013-02-05 19:17:49 +01:00
|
|
|
# Public-stream subscription sync check for zmirror; notifies page_admins.
# NOTE(review): "subscriptons" in service_description is misspelled. It is
# left untouched here because the description is part of the service's
# identity; rename deliberately if desired.
# NOTE(review): this block targets a hostgroup named zmirror, while the
# zephyr mirror forwarding service uses `host zmirror` -- confirm that a
# hostgroup with this name exists.
define service {
    use                     generic-service
    service_description     zmirror subscriptons syncing
    hostgroup_name          zmirror
    check_command           check_sync_public_streams!22
    contact_groups          page_admins
}
|
2013-02-19 18:06:25 +01:00
|
|
|
|
|
|
|
# RabbitMQ queue size check applied to the "frontends" hostgroup;
# notifies page_admins.
define service {
    use                     generic-service
    service_description     Check rabbitmq queue sizes
    hostgroup_name          frontends
    check_command           check_rabbitmq_queues!22
    contact_groups          page_admins
}
|
2013-02-19 21:29:38 +01:00
|
|
|
|
|
|
|
# Remote swap check applied to the "all" hostgroup; notifies admins.
# NOTE(review): 80% / 50% look like warning and critical thresholds --
# confirm their order and meaning against the check_remote_swap command
# definition.
define service {
    use                     generic-service
    service_description     swap
    hostgroup_name          all
    check_command           check_remote_swap!22!80%!50%
    contact_groups          admins
}
|