# Source code for distarray.metadata_utils

# encoding: utf-8
# ---------------------------------------------------------------------------
# Copyright (C) 2008-2014, IPython Development Team and Enthought, Inc.
# Distributed under the terms of the BSD License. See COPYING.rst.
# ---------------------------------------------------------------------------
"""
Utility functions for dealing with DistArray metadata.
"""
from __future__ import division
import operator
from itertools import product
from functools import reduce
from numbers import Integral
from collections import Sequence, Mapping
import numpy
from distarray import utils
from distarray.externals.six import next
from distarray.externals.six.moves import map, zip
# Register numpy integer types with numbers.Integral ABC.
Integral.register(numpy.signedinteger)
Integral.register(numpy.unsignedinteger)
class InvalidGridShapeError(Exception):
    """Raised when a grid shape is incompatible with the distribution or
    the communicator."""
class GridShapeError(Exception):
    """Raised when the processes cannot be distributed over the requested
    number of dimensions."""
def check_grid_shape_preconditions(shape, dist, comm_size):
    """Validate `shape`, `dist`, and `comm_size` before building a grid_shape.

    Raises
    ------
    ValueError
        If any of the inputs fails its precondition.
    """
    if comm_size < 1:
        msg = "comm_size >= 1 not satisfied, comm_size = %s" % (comm_size,)
        raise ValueError(msg)
    if len(shape) != len(dist):
        msg = ("len(shape) == len(dist) not satisfied, len(shape) = %s and "
               "len(dist) = %s" % (len(shape), len(dist)))
        raise ValueError(msg)
    for extent in shape:
        if extent < 0:
            msg = ("shape must be a sequence of non-negative integers, "
                   "shape = %s" % (shape,))
            raise ValueError(msg)
    valid_dist_types = ('b', 'c', 'n', 'u')
    for dist_type in dist:
        if dist_type not in valid_dist_types:
            msg = ("dist must be a sequence of 'b', 'n', 'c', 'u' "
                   "strings, dist = %s" % (dist,))
            raise ValueError(msg)
def check_grid_shape_postconditions(grid_shape, shape, dist, comm_size):
    """Check grid_shape for reasonableness after creating it.

    Parameters
    ----------
    grid_shape : tuple of int
        Candidate process-grid shape, one entry per dimension.
    shape : tuple of int
        Global array shape.
    dist : tuple of str
        dist_type character per dimension ('n' means not distributed).
    comm_size : int
        Total number of available processes.

    Raises
    ------
    ValueError
        If any postcondition is violated.
    """
    if not (len(grid_shape) == len(shape) == len(dist)):
        # Fix: message previously read "gird_shape".
        raise ValueError("len(grid_shape) == len(shape) == len(dist) not "
                         "satisfied, len(grid_shape) = %s and len(shape) = %s "
                         "and len(dist) = %s" % (len(grid_shape), len(shape),
                                                 len(dist)))
    if any(gs < 1 for gs in grid_shape):
        raise ValueError("all(gs >= 1 for gs in grid_shape) not satisfied, "
                         "grid_shape = %s" % (grid_shape,))
    # Non-distributed ('n') dimensions must use exactly one process.
    if any(gs != 1 for (d, gs) in zip(dist, grid_shape) if d == 'n'):
        # Fix: message previously read "satified".
        raise ValueError("all(gs == 1 for (d, gs) in zip(dist, grid_shape) if "
                         "d == 'n', not satisfied dist = %s and grid_shape = "
                         "%s" % (dist, grid_shape))
    # No dimension may use more processes than it has elements (zero-length
    # dimensions are exempt).
    if any(gs > s for (s, gs) in zip(shape, grid_shape) if s > 0):
        raise ValueError("all(gs <= s for (s, gs) in zip(shape, grid_shape) "
                         "if s > 0) not satisfied, shape = %s and grid_shape "
                         "= %s" % (shape, grid_shape))
    # Compute the process-count product once instead of twice.
    nprocs = reduce(operator.mul, grid_shape, 1)
    if nprocs > comm_size:
        raise ValueError("reduce(operator.mul, grid_shape, 1) <= comm_size not"
                         " satisfied, grid_shape = %s product = %s and "
                         "comm_size = %s" % (grid_shape, nprocs, comm_size))
def normalize_grid_shape(grid_shape, shape, dist, comm_size):
    """Pad `grid_shape` with 1s up to len(shape) dimensions and validate it
    against the `dist` tuple and `comm_size`.

    Raises
    ------
    ValueError
        If the input preconditions fail.
    InvalidGridShapeError
        If the padded grid shape disagrees with `dist`, or requires more
        processes than `comm_size` provides.
    """
    def _grid_shape_preconditions(gs, d):
        if any(g < 0 for g in gs):
            raise ValueError("grid_shape must be a sequence of non-negative "
                             "integers, grid_shape = %s" % (gs,))
        if len(gs) > len(d):
            raise ValueError("len(grid_shape) <= len(dist) not satisfied, "
                             "len(grid_shape) = %s and len(dist) = %s" %
                             (len(gs), len(d)))

    check_grid_shape_preconditions(shape, dist, comm_size)
    _grid_shape_preconditions(grid_shape, dist)

    # Pad with trailing 1s so grid_shape covers every array dimension.
    padding = (1,) * (len(shape) - len(grid_shape))
    grid_shape = tuple(grid_shape) + padding

    if len(grid_shape) != len(dist):
        msg = "grid_shape's length (%d) not equal to dist's length (%d)"
        raise InvalidGridShapeError(msg % (len(grid_shape), len(dist)))
    nprocs = 1
    for extent in grid_shape:
        nprocs *= extent
    if nprocs > comm_size:
        msg = "grid shape %r not compatible with comm size of %d."
        raise InvalidGridShapeError(msg % (grid_shape, comm_size))
    return grid_shape
def make_grid_shape(shape, dist, comm_size):
    """ Generate a `grid_shape` from `shape` tuple and `dist` tuple.

    Does not assume that `dim_data` has `proc_grid_size` set for each
    dimension.

    Attempts to allocate processes optimally for distributed dimensions.

    Parameters
    ----------
    shape : tuple of int
        The global shape of the array.
    dist: tuple of str
        dist_type character per dimension.
    comm_size : int
        Total number of processes to distribute.

    Returns
    -------
    dist_grid_shape : tuple of int

    Raises
    ------
    GridShapeError
        if not possible to distribute `comm_size` processes over number of
        dimensions.
    """
    check_grid_shape_preconditions(shape, dist, comm_size)
    # Indices of the dimensions that are actually distributed; 'n' marks a
    # non-distributed dimension.
    distdims = tuple(i for (i, v) in enumerate(dist) if v != 'n')
    ndistdim = len(distdims)
    if ndistdim == 0:
        # Nothing is distributed; no grid entries to compute.
        dist_grid_shape = ()
    elif ndistdim == 1:
        # Trivial case: all processes used for the one distributed dimension.
        if comm_size >= shape[distdims[0]]:
            dist_grid_shape = (shape[distdims[0]],)
        else:
            dist_grid_shape = (comm_size,)
    elif comm_size == 1:
        # Trivial case: only one process to distribute over!
        dist_grid_shape = (1,) * ndistdim
    else:  # Main case: comm_size > 1, ndistdim > 1.
        # All ways to express comm_size as a product of ndistdim factors
        # (semantics per distarray.utils.mult_partitions).
        factors = utils.mult_partitions(comm_size, ndistdim)
        if not factors:  # Can't factorize appropriately.
            raise GridShapeError("Cannot distribute array over processors.")
        reduced_shape = [shape[i] for i in distdims]
        # Reorder factors so they match the relative ordering in reduced_shape
        factors = [utils.mirror_sort(f, reduced_shape) for f in factors]
        # Pick the "best" factoring from `factors` according to which matches
        # the ratios among the dimensions in `shape`.
        rs_ratio = _compute_grid_ratios(reduced_shape)
        f_ratios = [_compute_grid_ratios(f) for f in factors]
        # Smallest Euclidean distance between ratio vectors wins.
        distances = [rs_ratio - f_ratio for f_ratio in f_ratios]
        norms = numpy.array([numpy.linalg.norm(d, 2) for d in distances])
        index = norms.argmin()
        # we now have the grid shape for the distributed dimensions.
        dist_grid_shape = tuple(int(i) for i in factors[index])
    # Create the grid_shape, all 1's for now.
    grid_shape = [1] * len(shape)
    # Fill grid_shape in the distdim slots using dist_grid_shape
    it = iter(dist_grid_shape)
    for distdim in distdims:
        grid_shape[distdim] = next(it)
    out_grid_shape = tuple(grid_shape)
    check_grid_shape_postconditions(out_grid_shape, shape, dist, comm_size)
    return out_grid_shape
def _compute_grid_ratios(shape):
shape = tuple(map(float, shape))
n = len(shape)
ratios = []
for (i, j) in product(range(n), range(n)):
if i < j:
ratios.append(shape[i] / shape[j])
return numpy.array(ratios)
def normalize_dist(dist, ndim):
    """Return a tuple containing dist-type for each dimension.

    Parameters
    ----------
    dist : str, list, tuple, or dict
    ndim : int

    Returns
    -------
    tuple of str
        Contains string distribution type for each dim.

    Examples
    --------
    >>> normalize_dist({0: 'b', 3: 'c'}, 4)
    ('b', 'n', 'n', 'c')
    """
    # A Mapping gives per-dimension entries; absent dims default to 'n'.
    if isinstance(dist, Mapping):
        return tuple(dist.get(i, 'n') for i in range(ndim))
    # Strings, lists, and tuples are all Sequences; pad with 'n' to ndim.
    if isinstance(dist, Sequence):
        padding = ('n',) * (ndim - len(dist))
        return tuple(dist) + padding
    raise TypeError("Dist must be a string, tuple, list or dict")
def _start_stop_block(size, proc_grid_size, proc_grid_rank):
"""Return `start` and `stop` for a regularly distributed block dim."""
nelements = size // proc_grid_size
if size % proc_grid_size != 0:
nelements += 1
start = proc_grid_rank * nelements
if start > size:
start = size
stop = start + nelements
if stop > size:
stop = size
return start, stop
def distribute_block_indices(dd):
    """Fill in `start` and `stop` in dim dict `dd` (no-op if both present)."""
    if 'start' in dd and 'stop' in dd:
        return
    start, stop = _start_stop_block(dd['size'],
                                    dd['proc_grid_size'],
                                    dd['proc_grid_rank'])
    dd['start'] = start
    dd['stop'] = stop
def distribute_cyclic_indices(dd):
    """Fill in `start` in dim dict `dd` (no-op if already present)."""
    if 'start' not in dd:
        # For a cyclic distribution the first local index is the grid rank.
        dd['start'] = dd['proc_grid_rank']
def distribute_indices(dd):
    """Fill in index related keys in dim dict `dd`.

    Raises
    ------
    TypeError
        If ``dd['dist_type']`` is not one of 'n', 'b', or 'c'.
    """
    dist_type = dd['dist_type']
    handlers = {'n': lambda dd: None,
                'b': distribute_block_indices,
                'c': distribute_cyclic_indices}
    try:
        handler = handlers[dist_type]
    except KeyError:
        msg = "dist_type %r not supported."
        raise TypeError(msg % dist_type)
    # Call the handler outside the try block so a KeyError raised inside it
    # (e.g. a missing 'size' key in dd) is not masked as an unsupported
    # dist_type.
    handler(dd)
def normalize_dim_dict(dd):
    """Fill out some degenerate dim_dicts."""
    # TODO: Fill out empty dim_dict alias here?
    if dd['dist_type'] != 'n':
        return
    # A non-distributed dimension always lives on a 1-process grid.
    dd['proc_grid_size'] = 1
    dd['proc_grid_rank'] = 0
def _positivify(index, size):
"""Return a positive index offset from a Sequence's start."""
if index is None or index >= 0:
return index
elif index < 0:
return size + index
def _check_bounds(index, size):
"""Check if an index is in bounds.
Assumes a positive index as returned by _positivify.
"""
if not 0 <= index < size:
raise IndexError("Index %r out of bounds" % index)
def tuple_intersection(t0, t1):
    """Compute intersection of a (start, stop, step) and a (start, stop) tuple.

    Assumes all values are positive.

    Parameters
    ----------
    t0 : 2-tuple or 3-tuple
        Tuple of (start, stop, [step]) representing an index range
    t1 : 2-tuple
        Tuple of (start, stop) representing an index range

    Returns
    -------
    3-tuple or None
        A tightly bounded interval, or None when the intersection is empty.
    """
    start0, stop0 = t0[0], t0[1]
    # A missing or None step defaults to 1.
    step0 = t0[2] if len(t0) > 2 and t0[2] is not None else 1
    start1, stop1 = t1

    # First point of t0's lattice that is >= start1.
    if start0 < start1:
        nsteps = int(numpy.ceil((start1 - start0) / step0))
        start2 = start0 + nsteps * step0
    else:
        start2 = start0

    # Last lattice point strictly below min(stop0, stop1), plus one.
    max_stop = min(stop0, stop1)
    span = max_stop - start2
    nsteps = span // step0
    if span % step0 == 0:
        nsteps -= 1
    stop2 = start2 + nsteps * step0 + 1

    if stop2 <= start2:
        return None
    return (start2, stop2, step0)
def positivify(index, size):
    """Check that an index is within bounds and return a positive version.

    Parameters
    ----------
    index : Integral or slice
    size : Integral

    Raises
    ------
    IndexError
        for out-of-bounds Integral indices
    TypeError
        for anything that is neither Integral nor slice
    """
    if isinstance(index, slice):
        # slice indexing doesn't check bounds
        return slice(_positivify(index.start, size),
                     _positivify(index.stop, size),
                     index.step)
    if isinstance(index, Integral):
        positive = _positivify(index, size)
        _check_bounds(positive, size)
        return positive
    raise TypeError("`index` must be of type Integral or slice.")
def sanitize_indices(indices, ndim=None, shape=None):
    """Classify and sanitize `indices`.

    * Wrap naked Integral, slice, or Ellipsis indices into tuples
    * Classify result as 'value' or 'view'
    * Expand `Ellipsis` objects to slices
    * If the length of the tuple-ized `indices` is < ndim (and it's
      provided), add slice(None)'s to indices until `indices` is ndim long
    * If `shape` is provided, call `positivify` on the indices

    Raises
    ------
    TypeError
        If `indices` is other than Integral, slice or a Sequence of these
    IndexError
        If len(indices) > ndim

    Returns
    -------
    2-tuple of (str, n-tuple of slices and Integral values)
    """
    def _is_view_component(i):
        return isinstance(i, (Integral, slice)) or i is Ellipsis

    # --- classification: wrap naked indices, decide 'value' vs 'view'
    if isinstance(indices, Integral):
        rtype = 'value'
        sanitized = (indices,)
    elif isinstance(indices, slice) or indices is Ellipsis:
        rtype = 'view'
        sanitized = (indices,)
    elif all(isinstance(i, Integral) for i in indices):
        rtype = 'value'
        sanitized = indices
    elif all(_is_view_component(i) for i in indices):
        rtype = 'view'
        sanitized = indices
    else:
        raise IndexError("Index must be an Integral, a slice, or a sequence "
                         "of Integrals and slices.")

    # --- Ellipsis handling
    if Ellipsis in sanitized:
        if ndim is None:
            raise RuntimeError("Can't call `sanitize_indices` on Ellipsis "
                               "without providing `ndim`.")
        # The first Ellipsis expands to as many full slices as needed.
        epos = sanitized.index(Ellipsis)
        filler = (slice(None),) * (ndim - (len(sanitized) - 1))
        sanitized = sanitized[:epos] + filler + sanitized[epos + 1:]
        # Any remaining Ellipsis objects become plain full slices.
        sanitized = tuple(slice(None) if i is Ellipsis else i
                          for i in sanitized)

    # --- pad or reject against ndim
    if ndim is not None:
        missing = ndim - len(sanitized)
        if missing < 0:
            raise IndexError("Too many indices.")
        elif missing > 0:
            # Incomplete indexing always yields a view.
            rtype = 'view'
            sanitized = sanitized + (slice(None),) * missing

    # --- normalize negative indices against shape
    if shape is not None:
        sanitized = tuple(positivify(i, size)
                          for (i, size) in zip(sanitized, shape))
    return (rtype, sanitized)
def normalize_reduction_axes(axes, ndim):
    """Return a tuple of positivified axis indices.

    `axes` may be None (meaning all axes), a single axis, or a sequence
    of axes.
    """
    if axes is None:
        return tuple(range(ndim))
    if isinstance(axes, Sequence):
        return tuple(positivify(a, ndim) for a in axes)
    # A single (non-sequence) axis value.
    return (positivify(axes, ndim),)
# Functions for getting a size from a dim_data for each dist_type.

# n
def non_dist_size(dim_data):
    """Size of a non-distributed ('n') dimension: the global size."""
    return dim_data['size']
# b
def block_size(dim_data):
    """Size of a block ('b') distributed dimension: the local extent
    stop - start."""
    return dim_data['stop'] - dim_data['start']
# Choose cyclic or block cyclic based on block size. This is necessary
# because they have the same dist type character.
def c_or_bc_chooser(dim_data):
    """Dispatch to cyclic_size or block_cyclic_size based on 'block_size'."""
    bs = dim_data.get('block_size', 1)
    if bs < 1:
        raise ValueError("block_size %s is invalid" % bs)
    if bs == 1:
        return cyclic_size(dim_data)
    return block_cyclic_size(dim_data)
# c
def cyclic_size(dim_data):
    """ Get a size from a cyclic dim_data. """
    size = dim_data['size']
    rank = dim_data.get('proc_grid_rank', 0)
    nprocs = dim_data.get('proc_grid_size', 1)
    # Count of indices rank, rank + nprocs, rank + 2*nprocs, ... below size.
    return (size - 1 - rank) // nprocs + 1
# c
def block_cyclic_size(dim_data):
    """ Get a size from a block-cyclic dim_data. """
    global_size = dim_data['size']
    block_size = dim_data.get('block_size', 1)
    grid_size = dim_data.get('proc_grid_size', 1)
    grid_rank = dim_data.get('proc_grid_rank', 0)
    # Number of full blocks, plus the length of a trailing partial block.
    global_nblocks, partial = divmod(global_size, block_size)
    # NOTE(review): the trailing partial block is always credited to grid
    # rank 0 here; in a cyclic block layout the partial block would land on
    # rank (global_nblocks % grid_size) -- confirm this matches the intended
    # distribution.
    local_partial = partial if grid_rank == 0 else 0
    # Full blocks assigned cyclically: block indices rank, rank + grid_size, ...
    local_nblocks = (global_nblocks - 1 - grid_rank) // grid_size + 1
    return local_nblocks * block_size + local_partial
# u
def unstructured_size(dim_data):
    """ Get a size from an unstructured dim_data. """
    # Index directly: a missing 'indices' key now raises a clear KeyError
    # instead of the obscure "len() of NoneType" TypeError that
    # dim_data.get('indices', None) used to produce.
    return len(dim_data['indices'])
def size_from_dim_data(dim_data):
    """Return the local size described by `dim_data`, dispatching on its
    'dist_type' entry."""
    sizer = size_chooser(dim_data['dist_type'])
    return sizer(dim_data)
def size_chooser(dist_type):
    """Return the size function for `dist_type`.

    Raises KeyError for an unknown dist_type.
    """
    return {'n': non_dist_size,
            'b': block_size,
            'c': c_or_bc_chooser,
            'u': unstructured_size}[dist_type]
def shapes_from_dim_data_per_rank(ddpr):  # ddpr = dim_data_per_rank
    """
    Given a dim_data_per_rank object, return the shapes of the localarrays.

    This requires no communication.
    """
    # One shape tuple per rank, one size per dimension.
    return [tuple(size_from_dim_data(dd) for dd in rank_dd)
            for rank_dd in ddpr]
# ----------------------------------------------------------------------------
# Redistribution-related utilities.
# ----------------------------------------------------------------------------
def _accum(start, next):
return tuple(s * next for s in start) + (next,)
def ndim_from_flat(flat, strides):
    """Convert a flat index into an n-dim coordinate tuple, given strides."""
    coords = []
    for stride in strides:
        coord, flat = divmod(flat, stride)
        coords.append(coord)
    return tuple(coords)
def _squeeze(accum, next):
last = accum[-1]
if not last:
return [next]
elif last[-1] != next[0]:
return accum + [next]
elif last[-1] == next[0]:
return accum[:-1] + [(last[0], next[-1])]
def condense(intervals):
    """Merge adjacent intervals where one's stop equals the next's start."""
    merged = [[]]
    for interval in intervals:
        merged = _squeeze(merged, interval)
    return merged
# ----------------------------------------------------------------------------
# `apply` related utilities.
# ----------------------------------------------------------------------------
def arg_kwarg_proxy_converter(args, kwargs, module_name='__main__'):
    """Dereference any Proxy objects in `args` and `kwargs` (kwargs is
    updated in place) and return the converted (args, kwargs) pair."""
    from importlib import import_module
    module = import_module(module_name)

    # In some situations, like redistributing a DistArray from one set of
    # targets to a disjoint set, the source and destination DistArrays (and
    # associated LocalArrays) are in different communicators with different
    # targets. In those cases, it is possible for a proxy object for one
    # DistArray to not refer to anything on this target. In that case,
    # `a.dereference()` raises an `AttributeError`. We intercept that here and
    # assign `None` instead.
    def _deref(obj):
        try:
            return obj.dereference()
        except AttributeError:
            return None

    # convert args
    converted = []
    for a in args:
        converted.append(_deref(a) if isinstance(a, module.Proxy) else a)

    # convert kwargs (values only; the key set is never changed)
    for k, v in kwargs.items():
        if isinstance(v, module.Proxy):
            kwargs[k] = _deref(v)

    return tuple(converted), kwargs