memgraph/tests/distributed/jail_service.py
Matej Ferencevic 4ad9cfe1f4 Fix distributed tests exit code
Reviewers: teon.banek, msantl

Reviewed By: teon.banek

Subscribers: pullbot

Differential Revision: https://phabricator.memgraph.io/D1499
2018-11-07 22:46:55 +01:00

163 lines
4.8 KiB
Python
Executable File

#!/usr/bin/env python3
import logging
import os
import signal
import subprocess
import sys
import tempfile
import traceback
import uuid
import xmlrpc.client
# workaround for xmlrpc max/min integer size
xmlrpc.client.MAXINT = 2**100
xmlrpc.client.MININT = -2**100
from common import get_absolute_path
from xmlrpc.server import SimpleXMLRPCServer
try:
import jail
except:
import jail_faker as jail
class XMLRPCServer(SimpleXMLRPCServer):
def _dispatch(self, method, params):
try:
return super()._dispatch(method, params)
except:
traceback.print_exc()
raise
class JailService:
"""
Knows how to start and stop binaries
"""
def __init__(self):
logging.basicConfig(level=logging.INFO)
self.log = logging.getLogger("JailService")
self.log.info("Initializing Jail Service")
self.processes = {}
self._generated_filenames = []
self.tempdir = tempfile.TemporaryDirectory()
self.process_died = False
def _get_proc(self, tid):
if tid not in self.processes:
raise Exception(
"Binary with tid {tid} does not exist".format(tid=tid))
return self.processes[tid]
def start(self, tid, binary_name, binary_args=None):
self.log.info("Starting Binary: {binary}".format(binary=binary_name))
self.log.info("With args: {args}".format(args=binary_args))
# find executable path
binary = get_absolute_path(binary_name, "build")
if not os.path.exists(binary):
# Apollo builds both debug and release binaries on diff
# so we need to use the release binary if the debug one
# doesn't exist
binary = get_absolute_path(binary_name, "build_release")
# fetch process
proc = self._get_proc(tid)
# start binary
proc.run(binary, args=binary_args, timeout=600)
msg = "Binary {binary} successfully started with tid {tid}".format(
binary=binary_name, tid=proc._tid)
self.log.info(msg)
def check_status(self, tid):
proc = self._get_proc(tid)
status = proc.get_status()
if status is None: return True
if status != 0:
self.process_died = True
assert status == 0, "The binary exited with a non-zero status!"
return False
def get_usage(self, tid):
usage = self._get_proc(tid).get_usage()
usage.update({"network": jail.get_network_usage()})
return usage
def wait(self, tid):
proc = self._get_proc(tid)
proc.wait()
def stop(self, tid):
self.log.info("Stopping binary with tid {tid}".format(tid=tid))
proc = self._get_proc(tid)
try:
proc.send_signal(jail.SIGTERM)
except Exception:
pass
proc.wait()
self.log.info("Binary with tid {tid} stopped".format(tid=tid))
def allocate_file(self, extension=""):
if extension != "" and not extension.startswith("."):
extension = "." + extension
tmp_name = str(uuid.uuid4())
while tmp_name in self._generated_filenames:
tmp_name = str(uuid.uuid4())
self._generated_filenames.append(tmp_name)
absolute_path = os.path.join(self.tempdir.name, tmp_name + extension)
return absolute_path
def read_file(self, absolute_path):
with open(absolute_path, "rb") as handle:
return xmlrpc.client.Binary(handle.read())
def get_jail(self):
proc = jail.get_process()
self.processes[proc._tid] = proc
return proc._tid
def store_label(self, label):
jail.store_label(label)
def shutdown(self):
self.log.info("Stopping Jail Service")
for tid in self.processes:
process = self.processes[tid]
if process.get_status() is None:
process.send_signal(jail.SIGTERM)
status = process.wait(check=False)
if status != 0:
self.process_died = True
if self.process_died:
print("A process died!", file=sys.stderr)
os._exit(int(self.process_died))
def main():
# set port dynamically
port = os.environ["CURRENT_MACHINE"][len("MACHINE"):]
port = 8000 + (int(port) * 100)
interface = os.environ[os.environ["CURRENT_MACHINE"]]
# init server
server = XMLRPCServer((interface, port), allow_none=True, logRequests=False)
server.register_introspection_functions()
server.register_instance(JailService())
# signal handler
def signal_sigterm(signum, frame):
server.server_close()
sys.exit()
try:
signal.signal(signal.SIGTERM, signal_sigterm)
server.serve_forever()
except KeyboardInterrupt:
server.server_close()
if __name__ == "__main__":
main()