2015-10-04 18:56:26 +02:00
|
|
|
#!/usr/bin/env python2.7
|
2013-02-19 18:06:25 +01:00
|
|
|
|
2016-03-10 17:15:34 +01:00
|
|
|
from __future__ import print_function
|
2013-02-19 18:06:25 +01:00
|
|
|
import sys
|
|
|
|
import re
|
|
|
|
import time
|
2013-10-28 15:54:32 +01:00
|
|
|
import os
|
2013-11-08 22:45:20 +01:00
|
|
|
import subprocess
|
2013-02-19 02:36:59 +01:00
|
|
|
|
2014-08-12 12:41:26 +02:00
|
|
|
WARN_THRESHOLD_DEFAULT = 10
|
|
|
|
WARN_THRESHOLD = {
|
|
|
|
'missedmessage_emails': 45,
|
|
|
|
}
|
|
|
|
CRIT_THRESHOLD_DEFAULT = 50
|
|
|
|
CRIT_THRESHOLD = {
|
|
|
|
'missedmessage_emails': 70,
|
|
|
|
}
|
2013-02-19 18:06:25 +01:00
|
|
|
|
|
|
|
states = {
|
|
|
|
0: "OK",
|
|
|
|
1: "WARNING",
|
|
|
|
2: "CRITICAL",
|
|
|
|
3: "UNKNOWN"
|
|
|
|
}
|
|
|
|
|
|
|
|
re = re.compile(r'(\w+)\t(\d+)')
|
2013-11-08 22:45:20 +01:00
|
|
|
output = subprocess.check_output(['/usr/sbin/rabbitmqctl', 'list_queues'], shell=False)
|
2013-02-19 18:06:25 +01:00
|
|
|
|
|
|
|
status = 0
|
|
|
|
max_count = 0
|
|
|
|
warn_queues = []
|
|
|
|
|
2013-10-28 15:54:32 +01:00
|
|
|
if 'USER' in os.environ and not os.environ['USER'] in ['root', 'rabbitmq']:
|
2016-03-10 17:15:34 +01:00
|
|
|
print("This script must be run as the root or rabbitmq user")
|
2013-03-19 20:04:28 +01:00
|
|
|
|
2013-02-19 18:06:25 +01:00
|
|
|
for line in output.split("\n"):
|
|
|
|
line = line.strip()
|
|
|
|
m = re.match(line)
|
|
|
|
if m:
|
|
|
|
queue = m.group(1)
|
|
|
|
count = int(m.group(2))
|
|
|
|
this_status = 0
|
2014-08-12 12:41:26 +02:00
|
|
|
if count > CRIT_THRESHOLD.get(queue, CRIT_THRESHOLD_DEFAULT):
|
2013-02-19 18:06:25 +01:00
|
|
|
this_status = 2
|
|
|
|
warn_queues.append(queue)
|
2014-08-12 12:41:26 +02:00
|
|
|
elif count > WARN_THRESHOLD.get(queue, WARN_THRESHOLD_DEFAULT):
|
2013-02-19 18:06:25 +01:00
|
|
|
this_status = max(status, 1)
|
|
|
|
warn_queues.append(queue)
|
|
|
|
|
|
|
|
status = max(status, this_status)
|
|
|
|
max_count = max(max_count, count)
|
|
|
|
|
|
|
|
warn_about = ", ".join(warn_queues)
|
|
|
|
now = int(time.time())
|
2014-01-24 00:02:26 +01:00
|
|
|
now_struct = time.gmtime(now)
|
|
|
|
|
|
|
|
# While we are sending digest emails, at 11am each weekday, the mail queues can
|
|
|
|
# get backed up; don't alert on those.
|
|
|
|
if not set(warn_queues) - set(("missedmessage_emails", "digest_emails")) and \
|
2014-03-12 17:04:26 +01:00
|
|
|
now_struct.tm_hour == 15 and now_struct.tm_min < 25:
|
2014-01-24 00:02:26 +01:00
|
|
|
status = 0
|
|
|
|
print("%s|%s|%s|processing digests, not alerting on elevated mail queues" % (
|
|
|
|
now, status, states[status]))
|
|
|
|
exit(0)
|
2013-02-19 18:06:25 +01:00
|
|
|
|
|
|
|
if status > 0:
|
|
|
|
print("%s|%s|%s|max count %s, queues affected: %s" % (now, status, states[status], max_count, warn_about))
|
|
|
|
else:
|
|
|
|
print("%s|%s|%s|queues normal, max count %s" % (now, status, states[status], max_count))
|