#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""
Helpers for embarrassingly parallel calculations using MPI. All functions
work just fine when running on one core and not started with MPI.

:copyright:
    Lion Krischer (krischer@geophysik.uni-muenchen.de), 2014-2015
:license:
    GNU Lesser General Public License, Version 3
    (http://www.gnu.org/copyleft/lesser.html)
"""
import collections
import colorama
import functools
import inspect
import itertools
import os
import sys
import traceback
import warnings

from mpi4py import MPI


class FunctionInfo(collections.namedtuple(
        "FunctionInfo",
        ["func_args", "result", "warnings", "exception", "traceback"])):
    """
    Namedtuple used to collect information about a function execution.

    It has the following fields: ``func_args``, ``result``, ``warnings``,
    ``exception``, and ``traceback``.
    """
    pass


def function_info(traceback_limit=10):
    """
    Decorator collecting information during the execution of a function.

    This is useful for collecting information about a function running on a
    number of processes/machines.

    It returns a FunctionInfo named tuple with the following fields:

    * ``func_args``: Dictionary containing all the function's arguments and
      values.
    * ``result``: The return value of the function. Will be None if an
      exception has been raised.
    * ``warnings``: A list with all warnings the function raised.
    * ``exception``: The exception the function raised. Will be None if no
      exception has been raised.
    * ``traceback``: The full traceback in case an exception occurred, as a
      string. A traceback object is not serializable, thus a string is used.

    >>> @function_info()
    ... def test(a, b=2):
    ...     return a / b
    >>> info = test(4, 1)
    >>> info.func_args
    {'a': 4, 'b': 1}
    >>> info.result
    4

    ``warnings`` is empty if no warning has been raised. Otherwise it will
    collect all warnings.

    >>> info.warnings
    []

    ``exception`` and ``traceback`` are ``None`` if the function completed
    successfully.

    >>> info.exception
    >>> info.traceback
    """
    def _function_info(f):
        @functools.wraps(f)
        def wrapper(*args, **kwargs):
            with warnings.catch_warnings(record=True) as w:
                warnings.simplefilter("always")
                result = None
                exception = None
                tb = None
                func_args = inspect.getcallargs(f, *args, **kwargs)
                try:
                    result = f(*args, **kwargs)
                except Exception as e:
                    # With help from http://stackoverflow.com/a/14528175.
                    exc_info = sys.exc_info()
                    stack = traceback.extract_stack(limit=traceback_limit)
                    tb = traceback.extract_tb(exc_info[2])
                    full_tb = stack[:-1] + tb
                    exc_line = traceback.format_exception_only(*exc_info[:2])
                    tb = ("Traceback (%i levels - most recent call last):\n"
                          % traceback_limit)
                    tb += "".join(traceback.format_list(full_tb))
                    tb += "\n"
                    tb += "".join(exc_line)
                    exception = e

            return FunctionInfo(
                func_args=func_args,
                result=result,
                exception=exception,
                warnings=w,
                traceback=tb)

        return wrapper
    return _function_info
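

# Illustrative sketch (not part of the original module): the exception case
# of the decorator documented above. Calling the decorated ``test`` function
# with arguments that raise does not propagate the error; the FunctionInfo
# captures it instead.
#
#     >>> info = test(4, 0)  # raises ZeroDivisionError internally
#     >>> info.result is None
#     True
#     >>> isinstance(info.exception, ZeroDivisionError)
#     True
#     >>> "ZeroDivisionError" in info.traceback
#     True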


def _execute_wrapped_function(func, parameters):
    """
    Helper function executing the passed function wrapped with the
    function_info decorator.

    This is necessary as a function needs to be importable, otherwise
    pickle does not work with it.
    """
    return function_info()(func)(**parameters)


def distribute_across_ranks(function, items, get_name, logfile):
    """
    Calls a function once for each item.

    The items will be distributed across MPI ranks if launched with MPI.

    :param function: The function to be executed for each item.
    :param items: The function will be executed once for each item. It
        expects a list of dictionaries so that ``function(**item)`` can
        work. Only rank 0 needs to pass this. It will be ignored coming
        from other ranks.
    :param get_name: Function to extract a name for each item to be able to
        produce better logfiles.
    :param logfile: The logfile to write.
    """
    def split(container, count):
        """
        Simple function splitting a container into count roughly equal
        chunks.

        Order is not preserved, but for the use case at hand this is
        potentially an advantage: data sitting in the same folder has a
        higher chance of being processed at the same time, so the disc head
        does not have to jump around so much. Of course this is very
        architecture dependent.
        """
        return [container[_i::count] for _i in range(count)]

    # Rank zero collects what needs to be done and distributes it across
    # all cores.
    if MPI.COMM_WORLD.rank == 0:
        total_length = len(items)
        items = split(items, MPI.COMM_WORLD.size)
    else:
        items = None

    # Now each rank knows what it has to process. This still works nicely
    # with only one core; the overhead is negligible.
    items = MPI.COMM_WORLD.scatter(items, root=0)

    results = []
    for _i, item in enumerate(items):
        results.append(_execute_wrapped_function(function, item))

        if MPI.COMM_WORLD.rank == 0:
            print("Approximately %i of %i items have been processed." % (
                min((_i + 1) * MPI.COMM_WORLD.size, total_length),
                total_length))

    results = MPI.COMM_WORLD.gather(results, root=0)
    if MPI.COMM_WORLD.rank != 0:
        return
    results = list(itertools.chain.from_iterable(results))

    successful_file_count = 0
    warning_file_count = 0
    failed_file_count = 0
    total_file_count = len(results)

    # Log the results.
    with open(logfile, "wt") as fh:
        for result in results:
            fh.write("\n============\nItem: %s" %
                     get_name(result.func_args))
            has_exception = False
            has_warning = False
            if result.exception:
                has_exception = True
                fh.write("\n")
                fh.write(result.traceback)
            elif result.warnings:
                has_warning = True
                for w in result.warnings:
                    fh.write("\nWarning: %s\n" % str(w))
            else:
                fh.write(" - SUCCESS")

            if has_exception:
                failed_file_count += 1
            elif has_warning:
                warning_file_count += 1
            else:
                successful_file_count += 1

    print("\nFinished processing %i items. See the logfile for "
          "details.\n" % total_file_count)
    print("\t%s%i files failed being processed.%s" % (
        colorama.Fore.RED, failed_file_count, colorama.Fore.RESET))
    print("\t%s%i files raised warnings while being processed.%s" % (
        colorama.Fore.YELLOW, warning_file_count, colorama.Fore.RESET))
    print("\t%s%i files have been processed without errors or warnings.%s" % (
        colorama.Fore.GREEN, successful_file_count, colorama.Fore.RESET))

    print("\nLogfile written to '%s'." % os.path.relpath(logfile))

    return results
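

# Illustrative usage sketch (hypothetical names, not part of this module).
# Each item is a dictionary of keyword arguments for the worker function;
# only rank 0 has to provide the item list. Run serially or with MPI, e.g.
# ``mpirun -n 4 python run_processing.py``:
#
#     from lasif.tools.parallel_helpers import distribute_across_ranks
#
#     def process(filename, factor=1.0):
#         ...  # per-item work goes here (hypothetical)
#
#     items = [{"filename": "a.mseed", "factor": 2.0},
#              {"filename": "b.mseed", "factor": 0.5}]
#
#     results = distribute_across_ranks(
#         function=process,
#         items=items,
#         get_name=lambda args: args["filename"],
#         logfile="processing.log")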