-
Notifications
You must be signed in to change notification settings - Fork 295
/
Copy pathsync_watchdog.py
40 lines (32 loc) · 1.32 KB
/
sync_watchdog.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
from tapiriik.database import db, close_connections
from tapiriik.sync import SyncStep
import os
import signal
import socket
from datetime import timedelta, datetime
# Watchdog pass over the sync workers registered for this host: remove the
# records of workers whose process is gone or whose heartbeat is too old,
# release the users those workers had locked, then record that this watchdog
# ran.
print("Sync watchdog run at %s" % datetime.now())

host = socket.gethostname()

for worker in db.sync_workers.find({"Host": host}):
    # Does the process still exist? (Signal 0 is used purely as a probe.)
    alive = True
    try:
        os.kill(worker["Process"], 0)
    except os.error:
        print("%s is no longer alive" % worker)
        alive = False

    # Has it been stalled for too long?
    if worker["State"] == SyncStep.List:
        timeout = timedelta(minutes=45)  # This can take a loooooooong time
    else:
        timeout = timedelta(minutes=10)  # But everything else shouldn't
    # Heartbeat is compared against the current naive UTC time.
    if alive and worker["Heartbeat"] < datetime.utcnow() - timeout:
        print("%s timed out" % worker)
        try:
            os.kill(worker["Process"], signal.SIGKILL)
        except os.error:
            # The worker may have exited between the probe above and this
            # kill. That must not abort the whole watchdog run, so treat it
            # like any other dead worker and fall through to the cleanup.
            print("%s could not be killed, assuming it already exited" % worker)
        alive = False

    # Clear it from the database if it's not alive.
    if not alive:
        db.sync_workers.remove({"_id": worker["_id"]})
        # Unlock users attached to it.
        db.users.update(
            {"SynchronizationWorker": worker["Process"], "SynchronizationHost": host},
            {"$unset": {"SynchronizationWorker": True}},
            multi=True,
        )

# Upsert this host's watchdog record with the time of this run.
db.sync_watchdogs.update({"Host": host}, {"Host": host, "Timestamp": datetime.utcnow()}, upsert=True)

close_connections()