X-Git-Url: https://wannabe.guru.org/gitweb/?a=blobdiff_plain;f=remote_worker.py;h=82b80ea3d722090ab7254eb24eac5884a9520172;hb=eb1c6392095947b3205c4d52cd9b1507e6cd776b;hp=bf8de6c66a36767ac267cfdd2bffe38317cbace0;hpb=9821d383ba3de886f8d11d00a588e49c2c280579;p=python_utils.git diff --git a/remote_worker.py b/remote_worker.py index bf8de6c..82b80ea 100755 --- a/remote_worker.py +++ b/remote_worker.py @@ -6,11 +6,11 @@ results. import logging import os -import platform import signal -import threading import sys +import threading import time +from typing import Optional import cloudpickle # type: ignore import psutil # type: ignore @@ -18,9 +18,9 @@ import psutil # type: ignore import argparse_utils import bootstrap import config +from stopwatch import Timer from thread_utils import background_thread - logger = logging.getLogger(__file__) cfg = config.add_commandline_args( @@ -32,28 +32,25 @@ cfg.add_argument( type=str, required=True, metavar='FILENAME', - help='The location of the bundle of code to execute.' + help='The location of the bundle of code to execute.', ) cfg.add_argument( '--result_file', type=str, required=True, metavar='FILENAME', - help='The location where we should write the computation results.' + help='The location where we should write the computation results.', ) cfg.add_argument( '--watch_for_cancel', action=argparse_utils.ActionNoYes, - default=False, - help='Should we watch for the cancellation of our parent ssh process?' + default=True, + help='Should we watch for the cancellation of our parent ssh process?', ) @background_thread def watch_for_cancel(terminate_event: threading.Event) -> None: - if platform.node() == 'VIDEO-COMPUTER': - logger.warning('Background thread not allowed on retarded computers, sorry.') - return logger.debug('Starting up background thread...') p = psutil.Process(os.getpid()) while True: @@ -67,7 +64,9 @@ def watch_for_cancel(terminate_event: threading.Event) -> None: saw_sshd = True break if not saw_sshd: - logger.error('Did not see sshd in our ancestors list?! Committing suicide.') + logger.error( + 'Did not see sshd in our ancestors list?! Committing suicide.' + ) os.system('pstree') os.kill(os.getpid(), signal.SIGTERM) time.sleep(5.0) @@ -78,12 +77,27 @@ def watch_for_cancel(terminate_event: threading.Event) -> None: time.sleep(1.0) +def cleanup_and_exit( + thread: Optional[threading.Thread], + stop_thread: Optional[threading.Event], + exit_code: int, +) -> None: + if stop_thread is not None: + stop_thread.set() + assert thread is not None + thread.join() + sys.exit(exit_code) + + @bootstrap.initialize def main() -> None: in_file = config.config['code_file'] out_file = config.config['result_file'] - (thread, stop_thread) = watch_for_cancel() + thread = None + stop_thread = None + if config.config['watch_for_cancel']: + (thread, stop_thread) = watch_for_cancel() logger.debug(f'Reading {in_file}.') try: @@ -92,8 +106,7 @@ def main() -> None: except Exception as e: logger.exception(e) logger.critical(f'Problem reading {in_file}. Aborting.') - stop_thread.set() - sys.exit(-1) + cleanup_and_exit(thread, stop_thread, 1) logger.debug(f'Deserializing {in_file}.') try: @@ -101,14 +114,12 @@ def main() -> None: except Exception as e: logger.exception(e) logger.critical(f'Problem deserializing {in_file}. Aborting.') - stop_thread.set() - sys.exit(-1) + cleanup_and_exit(thread, stop_thread, 2) logger.debug('Invoking user code...') - start = time.time() - ret = fun(*args, **kwargs) - end = time.time() - logger.debug(f'User code took {end - start:.1f}s') + with Timer() as t: + ret = fun(*args, **kwargs) + logger.debug(f'User code took {t():.1f}s') logger.debug('Serializing results') try: @@ -116,8 +127,7 @@ def main() -> None: except Exception as e: logger.exception(e) logger.critical(f'Could not serialize result ({type(ret)}). Aborting.') - stop_thread.set() - sys.exit(-1) + cleanup_and_exit(thread, stop_thread, 3) logger.debug(f'Writing {out_file}.') try: @@ -126,11 +136,8 @@ def main() -> None: except Exception as e: logger.exception(e) logger.critical(f'Error writing {out_file}. Aborting.') - stop_thread.set() - sys.exit(-1) - - stop_thread.set() - thread.join() + cleanup_and_exit(thread, stop_thread, 4) + cleanup_and_exit(thread, stop_thread, 0) if __name__ == '__main__':