2016-12-05 19:06:34 -06:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
################################################################################
|
|
|
|
#
|
|
|
|
# Rattail -- Retail Software Framework
|
2017-07-06 23:38:50 -05:00
|
|
|
# Copyright © 2010-2017 Lance Edgar
|
2016-12-05 19:06:34 -06:00
|
|
|
#
|
|
|
|
# This file is part of Rattail.
|
|
|
|
#
|
|
|
|
# Rattail is free software: you can redistribute it and/or modify it under the
|
2017-07-06 23:38:50 -05:00
|
|
|
# terms of the GNU General Public License as published by the Free Software
|
|
|
|
# Foundation, either version 3 of the License, or (at your option) any later
|
|
|
|
# version.
|
2016-12-05 19:06:34 -06:00
|
|
|
#
|
|
|
|
# Rattail is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
|
|
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
2017-07-06 23:38:50 -05:00
|
|
|
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
|
|
|
|
# details.
|
2016-12-05 19:06:34 -06:00
|
|
|
#
|
2017-07-06 23:38:50 -05:00
|
|
|
# You should have received a copy of the GNU General Public License along with
|
|
|
|
# Rattail. If not, see <http://www.gnu.org/licenses/>.
|
2016-12-05 19:06:34 -06:00
|
|
|
#
|
|
|
|
################################################################################
|
|
|
|
"""
|
|
|
|
Tempmon server daemon
|
|
|
|
"""
|
|
|
|
|
|
|
|
from __future__ import unicode_literals, absolute_import
|
|
|
|
|
|
|
|
import time
|
|
|
|
import datetime
|
|
|
|
import logging
|
|
|
|
|
|
|
|
from rattail.db import Session, api
|
2016-12-05 20:59:05 -06:00
|
|
|
from rattail_tempmon.db import Session as TempmonSession, model as tempmon
|
2016-12-05 19:06:34 -06:00
|
|
|
from rattail.daemon import Daemon
|
|
|
|
from rattail.time import localtime, make_utc
|
|
|
|
from rattail.mail import send_email
|
|
|
|
|
|
|
|
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
class TempmonServerDaemon(Daemon):
|
|
|
|
"""
|
|
|
|
Linux daemon implementation of tempmon server.
|
|
|
|
"""
|
|
|
|
timefmt = '%Y-%m-%d %H:%M:%S'
|
|
|
|
|
|
|
|
def run(self):
|
|
|
|
"""
|
|
|
|
Keeps an eye on tempmon readings and sends alerts as needed.
|
|
|
|
"""
|
|
|
|
self.extra_emails = self.config.getlist('rattail.tempmon', 'extra_emails', default=[])
|
|
|
|
while True:
|
|
|
|
self.check_readings()
|
2016-12-05 20:59:05 -06:00
|
|
|
|
|
|
|
# TODO: make this configurable
|
|
|
|
time.sleep(60)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
|
|
|
def check_readings(self):
|
|
|
|
self.now = make_utc()
|
|
|
|
session = TempmonSession()
|
2017-02-07 14:47:57 -06:00
|
|
|
|
2017-06-01 17:16:31 -05:00
|
|
|
try:
|
|
|
|
clients = session.query(tempmon.Client)\
|
|
|
|
.filter(tempmon.Client.enabled == True)
|
|
|
|
for client in clients:
|
|
|
|
self.check_readings_for_client(session, client)
|
|
|
|
except:
|
|
|
|
log.exception("Failed to check client probe readings (but will keep trying)")
|
|
|
|
session.rollback()
|
|
|
|
else:
|
|
|
|
session.commit()
|
|
|
|
finally:
|
|
|
|
session.close()
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
def check_readings_for_client(self, session, client):
|
|
|
|
delay = client.delay or 60
|
|
|
|
cutoff = self.now - datetime.timedelta(seconds=delay + 60)
|
2017-06-01 17:37:27 -05:00
|
|
|
online = True
|
2017-02-07 14:47:57 -06:00
|
|
|
for probe in client.enabled_probes():
|
2017-06-01 17:37:27 -05:00
|
|
|
online = online and bool(self.check_readings_for_probe(session, probe, cutoff))
|
2018-09-28 11:57:27 -05:00
|
|
|
|
|
|
|
# if client was previously marked online, but we have no "new"
|
|
|
|
# readings, then let's look closer to see if it's been long enough to
|
|
|
|
# mark it offline
|
|
|
|
if client.online and not online:
|
|
|
|
|
|
|
|
# we consider client offline if it has failed to take readings for
|
|
|
|
# 3 times in a row. allow a one minute buffer for good measure.
|
|
|
|
cutoff = self.now - datetime.timedelta(seconds=(delay * 3) + 60)
|
|
|
|
reading = session.query(tempmon.Reading)\
|
|
|
|
.filter(tempmon.Reading.client == client)\
|
|
|
|
.filter(tempmon.Reading.taken >= cutoff)\
|
|
|
|
.first()
|
|
|
|
if not reading:
|
|
|
|
log.info("marking client as OFFLINE: {}".format(client))
|
|
|
|
client.online = False
|
|
|
|
send_email(self.config, 'tempmon_client_offline', {
|
|
|
|
'client': client,
|
|
|
|
'now': localtime(self.config, self.now, from_utc=True),
|
|
|
|
})
|
2018-02-07 17:47:00 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
|
|
|
|
def check_readings_for_probe(self, session, probe, cutoff):
|
|
|
|
readings = session.query(tempmon.Reading)\
|
|
|
|
.filter(tempmon.Reading.probe == probe)\
|
|
|
|
.filter(tempmon.Reading.taken >= cutoff)\
|
|
|
|
.all()
|
|
|
|
if readings:
|
|
|
|
# we really only care about the latest reading
|
|
|
|
reading = sorted(readings, key=lambda r: r.taken)[-1]
|
|
|
|
|
|
|
|
if (reading.degrees_f <= probe.critical_temp_min or
|
|
|
|
reading.degrees_f >= probe.critical_temp_max):
|
|
|
|
self.update_status(probe, self.enum.TEMPMON_PROBE_STATUS_CRITICAL_TEMP, reading)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
elif reading.degrees_f < probe.good_temp_min:
|
|
|
|
self.update_status(probe, self.enum.TEMPMON_PROBE_STATUS_LOW_TEMP, reading)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
elif reading.degrees_f > probe.good_temp_max:
|
|
|
|
self.update_status(probe, self.enum.TEMPMON_PROBE_STATUS_HIGH_TEMP, reading)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
else: # temp is good
|
|
|
|
self.update_status(probe, self.enum.TEMPMON_PROBE_STATUS_GOOD_TEMP, reading)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-02-07 14:47:57 -06:00
|
|
|
else: # no readings for probe
|
|
|
|
self.update_status(probe, self.enum.TEMPMON_PROBE_STATUS_ERROR)
|
2016-12-05 19:06:34 -06:00
|
|
|
|
2017-06-01 17:16:31 -05:00
|
|
|
return readings
|
|
|
|
|
2016-12-05 19:06:34 -06:00
|
|
|
def update_status(self, probe, status, reading=None):
|
2016-12-10 23:04:42 -06:00
|
|
|
data = {
|
|
|
|
'probe': probe,
|
|
|
|
'status': self.enum.TEMPMON_PROBE_STATUS[status],
|
|
|
|
'reading': reading,
|
|
|
|
'taken': localtime(self.config, reading.taken, from_utc=True) if reading else None,
|
|
|
|
'now': localtime(self.config),
|
|
|
|
}
|
|
|
|
|
2016-12-05 19:06:34 -06:00
|
|
|
prev_status = probe.status
|
2016-12-11 10:46:53 -06:00
|
|
|
prev_alert_sent = probe.status_alert_sent
|
2016-12-05 19:06:34 -06:00
|
|
|
if probe.status != status:
|
|
|
|
probe.status = status
|
|
|
|
probe.status_changed = self.now
|
|
|
|
probe.status_alert_sent = None
|
|
|
|
|
2016-12-10 12:40:50 -06:00
|
|
|
# send email when things go back to normal, after being bad
|
2016-12-11 10:46:53 -06:00
|
|
|
if status == self.enum.TEMPMON_PROBE_STATUS_GOOD_TEMP and prev_alert_sent:
|
2016-12-10 23:04:42 -06:00
|
|
|
send_email(self.config, 'tempmon_good_temp', data)
|
2016-12-10 12:40:50 -06:00
|
|
|
probe.status_alert_sent = self.now
|
|
|
|
|
|
|
|
# no (more) email if status is good
|
2016-12-05 19:06:34 -06:00
|
|
|
if status == self.enum.TEMPMON_PROBE_STATUS_GOOD_TEMP:
|
|
|
|
return
|
|
|
|
|
|
|
|
# no email if we already sent one...until timeout is reached
|
|
|
|
if probe.status_alert_sent:
|
|
|
|
timeout = datetime.timedelta(minutes=probe.status_alert_timeout)
|
|
|
|
if (self.now - probe.status_alert_sent) <= timeout:
|
|
|
|
return
|
|
|
|
|
2016-12-10 12:40:50 -06:00
|
|
|
# delay even the first email, until configured threshold is reached
|
2018-02-07 17:45:06 -06:00
|
|
|
# unless we have a critical status
|
|
|
|
if status != self.enum.TEMPMON_PROBE_STATUS_CRITICAL_TEMP:
|
|
|
|
timeout = datetime.timedelta(minutes=probe.therm_status_timeout)
|
|
|
|
if (self.now - probe.status_changed) <= timeout:
|
|
|
|
return
|
2016-12-10 12:40:50 -06:00
|
|
|
|
2016-12-05 19:06:34 -06:00
|
|
|
msgtypes = {
|
|
|
|
self.enum.TEMPMON_PROBE_STATUS_LOW_TEMP : 'tempmon_low_temp',
|
|
|
|
self.enum.TEMPMON_PROBE_STATUS_HIGH_TEMP : 'tempmon_high_temp',
|
|
|
|
self.enum.TEMPMON_PROBE_STATUS_CRITICAL_TEMP : 'tempmon_critical_temp',
|
|
|
|
self.enum.TEMPMON_PROBE_STATUS_ERROR : 'tempmon_error',
|
|
|
|
}
|
|
|
|
|
|
|
|
send_email(self.config, msgtypes[status], data)
|
|
|
|
|
|
|
|
# maybe send more emails if config said so
|
|
|
|
for msgtype in self.extra_emails:
|
|
|
|
send_email(self.config, msgtype, data)
|
|
|
|
|
|
|
|
probe.status_alert_sent = self.now
|
|
|
|
|
|
|
|
|
|
|
|
def make_daemon(config, pidfile=None):
|
|
|
|
"""
|
|
|
|
Returns a tempmon server daemon instance.
|
|
|
|
"""
|
|
|
|
if not pidfile:
|
|
|
|
pidfile = config.get('rattail.tempmon', 'server.pid_path',
|
|
|
|
default='/var/run/rattail/tempmon-server.pid')
|
|
|
|
return TempmonServerDaemon(pidfile, config=config)
|