#!/usr/bin/env python3

# © Copyright 2021-2023, Scott Gasch

"""A decorator to help with simple parallelization.  When decorated
functions are invoked they execute on a background thread, process or
remote machine depending on the style of decoration::

    from pyutils.parallelize import parallelize as p

    @p.parallelize    # defaults to thread-mode
    def my_function(a, b, c) -> int:
        ...do some slow / expensive work, e.g., an http request

    # Run with background subprocess
    @p.parallelize(method=Method.PROCESS)
    def my_other_function(d, e, f) -> str:
        ...do more really expensive work, e.g., a network read

    # Run in a helper process on another machine.
    @p.parallelize(method=Method.REMOTE)
    def my_other_other_function(g, h) -> int:
        ...this work will be distributed to a remote machine pool

This will just work out of the box with `Method.THREAD` (the default)
and `Method.PROCESS` but in order to use `Method.REMOTE` you need to
do some setup work:

    1. To use `@parallelize(method=Method.REMOTE)` with your code you
       need to hook your code into :mod:`pyutils.config` to enable
       commandline flags from `pyutil` files.  You can do this by
       either wrapping your main entry point with the
       :meth:`pyutils.bootstrap.initialize` decorator or just calling
       `config.parse()` early in your program.  See instructions in
       :mod:`pyutils.bootstrap` and :mod:`pyutils.config` for
       more information.

    2. You need to create and configure a pool of worker machines.
       All of these machines should run the same version of Python,
       ideally in a virtual environment (venv) with the same
       Python dependencies installed.  See: https://docs.python.org/3/library/venv.html

       .. warning::

           Different versions of code, libraries, or of the interpreter
           itself can cause issues with running cloudpicked code.

    3. You need an account that can ssh into any / all of these pool
       machines non-interactively to perform tasks such as copying
       code to the worker machine and running Python in the
       aforementioned virtual environment.  This likely means setting
       up `ssh` / `scp` with key-based authentication.
       See: https://www.digitalocean.com/community/tutorials/how-to-set-up-ssh-keys-2

    4. You need to tell this parallelization framework about the pool
       of machines you created by editing a JSON-based configuration
       file.  The location of this file defaults to
       :file:`.remote_worker_records` in your home directory but can
       be overridden via the `--remote_worker_records_file`
       commandline argument.  An example JSON configuration `can be
       found under examples
       <https://wannabe.guru.org/gitweb/?p=pyutils.git;a=blob_plain;f=examples/parallelize_config/.remote_worker_records;hb=HEAD>`_.

    5. Finally, you will also need tell the
       :class:`pyutils.parallelize.executors.RemoteExecutor` how to
       invoke the :file:`remote_worker.py` on remote machines by
       passing its path on remote worker machines in your setup via
       the `--remote_worker_helper_path` commandline flag (or,
       honestly, if you made it this far, just update the default in
       this code -- find `executors.py` under `site-packages` in your
       virtual environment and update the default value of the
       `--remote_worker_helper_path` flag)

    If you're trying to set this up and struggling, email me at
    scott.gasch@gmail.com.  I'm happy to help.

    What you get back when you call a decorated function (using
    threads, processes or a remote worker) is a
    :class:`pyutils.parallelize.smart_future.SmartFuture`.  This class
    attempts to transparently wrap a normal Python :class:`Future`
    (see
    https://docs.python.org/3/library/concurrent.futures.html#future-objects).
    If your code just uses the result of a `parallelized` method it
    will block waiting on the result of the wrapped function as soon
    as it uses that result in a manner that requires its value to be
    known (e.g. using it in an expression, calling a method on it,
    passing it into a method, hashing it / using it as a dict key,
    etc...)  But you can do operations that do not require the value
    to be known (e.g. storing it in a list, storing it as a value in a
    dict, etc...) safely without blocking.

    There are two helper methods in
    :mod:`pyutils.parallelize.smart_future` to help deal with these
    :class:`SmartFuture` objects called
    :meth:`pyutils.parallelize.smart_future.wait_all` and
    :meth:`pyutils.parallelize.smart_future.wait_any`.  These, when
    given a collection of :class:`SmartFuture` objects,
    will block until one (any) or all (all) are finished and yield the
    finished objects to the caller.  Callers can be confident that any
    objects returned from these methods will not block when accessed.
    See documentation in :mod:`pyutils.parallelize.smart_future` for
    more details.

"""

import atexit
import functools
import typing
from enum import Enum


class Method(Enum):
    """How should we parallelize; by threads, processes or remote workers?"""

    THREAD = 1
    PROCESS = 2
    REMOTE = 3


def parallelize(
    _funct: typing.Optional[typing.Callable] = None, *, method: Method = Method.THREAD
) -> typing.Callable:
    """This is a decorator that was created to make multi-threading,
    multi-processing and remote machine parallelism simple in Python.

    Sample usage::

        from pyutils.parallelize import parallelize as p

        @p.parallelize    # defaults to thread-mode
        def my_function(a, b, c) -> int:
            ...do some slow / expensive work, e.g., an http request

        # Run with background subprocess
        @p.parallelize(method=Method.PROCESS)
        def my_other_function(d, e, f) -> str:
            ...do more really expensive work, e.g., a network read

        # Run in a helper process on another machine.
        @p.parallelize(method=Method.REMOTE)
        def my_other_other_function(g, h) -> int:
            ...this work will be distributed to a remote machine pool

    This decorator will invoke the wrapped function on:

        - `Method.THREAD` (default): a background thread
        - `Method.PROCESS`: a background process
        - `Method.REMOTE`: a process on a remote host

    The wrapped function returns immediately with a value that is
    wrapped in a
    :class:`pyutils.parallelize.smart_future.SmartFuture`.  This value
    will block if it is either read directly (via a call to
    :meth:`_resolve`) or indirectly (by using the result in an
    expression, printing it, hashing it, passing it a function
    argument, etc...).  See comments on :class:`SmartFuture` for
    details.  The value can be safely stored (without hashing) or
    passed as an argument without causing it to block waiting on a
    result.  There are some convenience methods for dealing with
    collections of :class:`SmartFuture` objects defined in
    :file:`smart_future.py`, namely
    :meth:`pyutils.parallelize.smart_future.wait_any` and
    :meth:`pyutils.parallelize.smart_future.wait_all`.

    .. warning::
        You may stack @parallelized methods and it will "work".
        That said, having multiple layers of :code:`Method.PROCESS` or
        :code:`Method.REMOTE` will prove to be problematic because each
        process in the stack will use its own independent pool which will
        likely overload your machine with processes or your network with
        remote processes beyond the control mechanisms built into one
        instance of the pool.  Be careful.

    .. warning::
        There is non-trivial overhead of pickling code and
        copying it over the network when you use :code:`Method.REMOTE`.  There's
        a smaller but still considerable cost of creating a new process
        and passing code to/from it when you use :code:`Method.PROCESS`.

    """

    def wrapper(funct: typing.Callable):
        @functools.wraps(funct)
        def inner_wrapper(*args, **kwargs):
            from pyutils.parallelize import executors, smart_future

            # Look for as of yet unresolved arguments in _funct's
            # argument list and resolve them now.
            newargs = []
            for arg in args:
                newargs.append(smart_future.SmartFuture.resolve(arg))
            newkwargs = {}
            for kw in kwargs:
                newkwargs[kw] = smart_future.SmartFuture.resolve(kwargs[kw])

            executor = None
            if method == Method.PROCESS:
                executor = executors.DefaultExecutors().process_pool()
            elif method == Method.THREAD:
                executor = executors.DefaultExecutors().thread_pool()
            elif method == Method.REMOTE:
                executor = executors.DefaultExecutors().remote_pool()
            assert executor is not None
            atexit.register(executors.DefaultExecutors().shutdown)

            future = executor.submit(funct, *newargs, **newkwargs)

            # Wrap the future that's returned in a SmartFuture object
            # so that callers do not need to call .result(), they can
            # just use is as normal.
            return smart_future.SmartFuture(future)

        return inner_wrapper

    if _funct is None:
        return wrapper
    else:
        return wrapper(_funct)