lightning/pytorch_lightning/metrics/converters.py

"""
This file provides functions and decorators for automated input and output
conversion to/from :class:`numpy.ndarray` and :class:`torch.Tensor` as well as utilities to
sync tensors between different processes in a DDP scenario, when needed.
"""

import sys
import numbers
from typing import Union, Any, Callable, Optional

import numpy as np
import torch
from torch.utils.data._utils.collate import np_str_obj_array_pattern

from pytorch_lightning.utilities.apply_func import apply_to_collection


def _apply_to_inputs(func_to_apply: Callable, *dec_args, **dec_kwargs) -> Callable:
    """
    Decorator function to apply a function to all inputs of a function.
    Args:
        func_to_apply: the function to apply to the inputs
        *dec_args: positional arguments for the function to be applied
        **dec_kwargs: keyword arguments for the function to be applied

    Returns:
        the decorated function
    """

    def decorator_fn(func_to_decorate):
        # actual function applying the give function to inputs
        def new_func(*args, **kwargs):
            args = func_to_apply(args, *dec_args, **dec_kwargs)
            kwargs = func_to_apply(kwargs, *dec_args, **dec_kwargs)
            return func_to_decorate(*args, **kwargs)

        return new_func

    return decorator_fn


def _apply_to_outputs(func_to_apply: Callable, *dec_args, **dec_kwargs) -> Callable:
    """
    Decorator function to apply a function to all outputs of a function.
    Args:
        func_to_apply: the function to apply to the outputs
        *dec_args: positional arguments for the function to be applied
        **dec_kwargs: keyword arguments for the function to be applied

    Returns:
        the decorated function
    """

    def decorator_fn(function_to_decorate):
        # actual function applying the give function to outputs
        def new_func(*args, **kwargs):
            result = function_to_decorate(*args, **kwargs)
            return func_to_apply(result, *dec_args, **dec_kwargs)

        return new_func

    return decorator_fn


def _convert_to_tensor(data: Any) -> Any:
    """
    Maps all kind of collections and numbers to tensors.

    Args:
        data: the data to convert to tensor

    Returns:
        the converted data

    """
    if isinstance(data, numbers.Number):
        return torch.tensor([data])
    # is not array of object
    elif isinstance(data, np.ndarray) and np_str_obj_array_pattern.search(data.dtype.str) is None:
        return torch.from_numpy(data)
    elif isinstance(data, torch.Tensor):
        return data

    raise TypeError(f"The given type ('{type(data).__name__}') cannot be converted to a tensor!")


def _convert_to_numpy(data: Union[torch.Tensor, np.ndarray, numbers.Number]) -> np.ndarray:
    """Convert all tensors and numpy arrays to numpy arrays.
    Args:
        data: the tensor or array to convert to numpy

    Returns:
        the resulting numpy array

    """
    if isinstance(data, torch.Tensor):
        return data.cpu().detach().numpy()
    elif isinstance(data, numbers.Number):
        return np.array([data])
    elif isinstance(data, np.ndarray):
        return data

    raise TypeError("The given type ('%s') cannot be converted to a numpy array!" % type(data).__name__)


def _numpy_metric_conversion(func_to_decorate: Callable) -> Callable:
    """
    Decorator handling the argument conversion for metrics working on numpy.
    All inputs of the decorated function will be converted to numpy and all
    outputs will be converted to tensors.

    Args:
        func_to_decorate: the function whose inputs and outputs shall be converted

    Returns:
        the decorated function

    """
    # applies collection conversion from tensor to numpy to all inputs
    # we need to include numpy arrays here, since otherwise they will also be treated as sequences
    func_convert_inputs = _apply_to_inputs(
        apply_to_collection, (torch.Tensor, np.ndarray, numbers.Number), _convert_to_numpy)(func_to_decorate)
    # converts all inputs back to tensors (device doesn't matter here, since this is handled by BaseMetric)
    func_convert_in_out = _apply_to_outputs(_convert_to_tensor)(func_convert_inputs)
    return func_convert_in_out


def _tensor_metric_conversion(func_to_decorate: Callable) -> Callable:
    """
    Decorator Handling the argument conversion for metrics working on tensors.
    All inputs and outputs of the decorated function will be converted to tensors

    Args:
        func_to_decorate: the function whose inputs and outputs shall be converted

    Returns:
        the decorated function

    """
    # converts all inputs to tensor if possible
    # we need to include tensors here, since otherwise they will also be treated as sequences
    func_convert_inputs = _apply_to_inputs(
        apply_to_collection, (torch.Tensor, np.ndarray, numbers.Number), _convert_to_tensor)(func_to_decorate)
    # convert all outputs to tensor if possible
    return _apply_to_outputs(_convert_to_tensor)(func_convert_inputs)


def _sync_ddp_if_available(result: Union[torch.Tensor],
                           group: Optional[Any] = None,
                           reduce_op: Optional[torch.distributed.ReduceOp] = None,
                           ) -> torch.Tensor:
    """
    Function to reduce the tensors from several ddp processes to one master process

    Args:
        result: the value to sync and reduce (typically tensor or number)
        group: the process group to gather results from. Defaults to all processes (world)
        reduce_op: the reduction operation. Defaults to sum.

    Returns:
        reduced value

    """

    if torch.distributed.is_available() and torch.distributed.is_initialized():
        if group is None:
            group = torch.distributed.group.WORLD

        if reduce_op is None:
            reduce_op = torch.distributed.ReduceOp.SUM

        # sync all processes before reduction
        torch.distributed.barrier(group=group)
        torch.distributed.all_reduce(result, op=reduce_op, group=group,
                                     async_op=False)

    return result


def numpy_metric(group: Optional[Any] = None,
                 reduce_op: Optional[torch.distributed.ReduceOp] = None) -> Callable:
    """
    This decorator shall be used on all function metrics working on numpy arrays.

    It handles the argument conversion and DDP reduction for metrics working on numpy.
    All inputs of the decorated function will be converted to numpy and all
    outputs will be converted to tensors.
    In DDP Training all output tensors will be reduced according to the given rules.

    Args:
        group: the process group to gather results from. Defaults to all processes (world)
        reduce_op: the reduction operation. Defaults to sum

    Returns:
        the decorated function

    """

    def decorator_fn(func_to_decorate):
        return _apply_to_outputs(apply_to_collection, torch.Tensor, _sync_ddp_if_available,
                                 group=group,
                                 reduce_op=reduce_op)(_numpy_metric_conversion(func_to_decorate))

    return decorator_fn


def tensor_metric(group: Optional[Any] = None,
                  reduce_op: Optional[torch.distributed.ReduceOp] = None) -> Callable:
    """
    This decorator shall be used on all function metrics working on tensors.

    It handles the argument conversion and DDP reduction for metrics working on tensors.
    All inputs and outputs of the decorated function will be converted to tensors.
    In DDP Training all output tensors will be reduced according to the given rules.

    Args:
       group: the process group to gather results from. Defaults to all processes (world)
       reduce_op: the reduction operation. Defaults to sum

    Returns:
       the decorated function

    """

    def decorator_fn(func_to_decorate):
        return _apply_to_outputs(apply_to_collection, torch.Tensor, _sync_ddp_if_available,
                                 group=group,
                                 reduce_op=reduce_op)(_tensor_metric_conversion(func_to_decorate))

    return decorator_fn
New metric classes (#1326) (#1877) * New metric classes (#1326) * Create metrics package * Create metric.py * Create utils.py * Create __init__.py * add tests for metric utils * add docstrings for metrics utils * add function to recursively apply other function to collection * add tests for this function * update test * Update pytorch_lightning/metrics/metric.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * update metric name * remove example docs * fix tests * add metric tests * fix to tensor conversion * fix apply to collection * Update CHANGELOG.md * Update pytorch_lightning/metrics/metric.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * remove tests from init * add missing type annotations * rename utils to convertors * Create metrics.rst * Update index.rst * Update index.rst * Update pytorch_lightning/metrics/convertors.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update pytorch_lightning/metrics/convertors.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update pytorch_lightning/metrics/convertors.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update pytorch_lightning/metrics/metric.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update tests/utilities/test_apply_to_collection.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update tests/utilities/test_apply_to_collection.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Update tests/metrics/convertors.py Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * Apply suggestions from code review Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * add doctest example * rename file and fix imports * added parametrized test * replace lambda with inlined function * rename apply_to_collection to apply_func * Separated class description from init args * Apply suggestions from code review Co-Authored-By: Jirka Borovec <Borda@users.noreply.github.com> * adjust random values * suppress output when seeding * remove gpu from doctest * Add requested changes and add ellipsis for doctest * forgot to push these files... * add explicit check for dtype to convert to * fix ddp tests * remove explicit ddp destruction Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> * move dtype device mixin to more general place * refactor to general device dtype mixin * add initial metric package description * change default to none for mac os * pep8 * fix import * Update index.rst * Update ci-testing.yml * Apply suggestions from code review Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> * Update CHANGELOG.md * Update pytorch_lightning/metrics/converters.py * readme * Update metric.py * Update pytorch_lightning/metrics/converters.py Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> Co-authored-by: William Falcon <waf2107@columbia.edu> Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> Co-authored-by: Jirka <jirka@pytorchlightning.ai> 2020-05-19 15:05:07 +00:00			`"""`
			`This file provides functions and decorators for automated input and output`
			conversion to/from :class:`numpy.ndarray` and :class:`torch.Tensor` as well as utilities to
			`sync tensors between different processes in a DDP scenario, when needed.`
			`"""`

			`import sys`
			`import numbers`
			`from typing import Union, Any, Callable, Optional`

			`import numpy as np`
			`import torch`
			`from torch.utils.data._utils.collate import np_str_obj_array_pattern`

			`from pytorch_lightning.utilities.apply_func import apply_to_collection`


			`def _apply_to_inputs(func_to_apply: Callable, dec_args, *dec_kwargs) -> Callable:`
			`"""`
			`Decorator function to apply a function to all inputs of a function.`
			`Args:`
			`func_to_apply: the function to apply to the inputs`
			`*dec_args: positional arguments for the function to be applied`
			`**dec_kwargs: keyword arguments for the function to be applied`

			`Returns:`
			`the decorated function`
			`"""`

			`def decorator_fn(func_to_decorate):`
			`# actual function applying the give function to inputs`
			`def new_func(args, *kwargs):`
			`args = func_to_apply(args, dec_args, *dec_kwargs)`
			`kwargs = func_to_apply(kwargs, dec_args, *dec_kwargs)`
			`return func_to_decorate(args, *kwargs)`

			`return new_func`

			`return decorator_fn`


			`def _apply_to_outputs(func_to_apply: Callable, dec_args, *dec_kwargs) -> Callable:`
			`"""`
			`Decorator function to apply a function to all outputs of a function.`
			`Args:`
			`func_to_apply: the function to apply to the outputs`
			`*dec_args: positional arguments for the function to be applied`
			`**dec_kwargs: keyword arguments for the function to be applied`

			`Returns:`
			`the decorated function`
			`"""`

			`def decorator_fn(function_to_decorate):`
			`# actual function applying the give function to outputs`
			`def new_func(args, *kwargs):`
			`result = function_to_decorate(args, *kwargs)`
			`return func_to_apply(result, dec_args, *dec_kwargs)`

			`return new_func`

			`return decorator_fn`


			`def _convert_to_tensor(data: Any) -> Any:`
			`"""`
			`Maps all kind of collections and numbers to tensors.`

			`Args:`
			`data: the data to convert to tensor`

			`Returns:`
			`the converted data`

			`"""`
			`if isinstance(data, numbers.Number):`
			`return torch.tensor([data])`
			`# is not array of object`
			`elif isinstance(data, np.ndarray) and np_str_obj_array_pattern.search(data.dtype.str) is None:`
			`return torch.from_numpy(data)`
			`elif isinstance(data, torch.Tensor):`
			`return data`

			`raise TypeError(f"The given type ('{type(data).__name__}') cannot be converted to a tensor!")`


			`def _convert_to_numpy(data: Union[torch.Tensor, np.ndarray, numbers.Number]) -> np.ndarray:`
			`"""Convert all tensors and numpy arrays to numpy arrays.`
			`Args:`
			`data: the tensor or array to convert to numpy`

			`Returns:`
			`the resulting numpy array`

			`"""`
			`if isinstance(data, torch.Tensor):`
			`return data.cpu().detach().numpy()`
			`elif isinstance(data, numbers.Number):`
			`return np.array([data])`
			`elif isinstance(data, np.ndarray):`
			`return data`

			`raise TypeError("The given type ('%s') cannot be converted to a numpy array!" % type(data).__name__)`


			`def _numpy_metric_conversion(func_to_decorate: Callable) -> Callable:`
			`"""`
			`Decorator handling the argument conversion for metrics working on numpy.`
			`All inputs of the decorated function will be converted to numpy and all`
			`outputs will be converted to tensors.`

			`Args:`
			`func_to_decorate: the function whose inputs and outputs shall be converted`

			`Returns:`
			`the decorated function`

			`"""`
			`# applies collection conversion from tensor to numpy to all inputs`
			`# we need to include numpy arrays here, since otherwise they will also be treated as sequences`
			`func_convert_inputs = _apply_to_inputs(`
			`apply_to_collection, (torch.Tensor, np.ndarray, numbers.Number), _convert_to_numpy)(func_to_decorate)`
			`# converts all inputs back to tensors (device doesn't matter here, since this is handled by BaseMetric)`
			`func_convert_in_out = _apply_to_outputs(_convert_to_tensor)(func_convert_inputs)`
			`return func_convert_in_out`


			`def _tensor_metric_conversion(func_to_decorate: Callable) -> Callable:`
			`"""`
			`Decorator Handling the argument conversion for metrics working on tensors.`
			`All inputs and outputs of the decorated function will be converted to tensors`

			`Args:`
			`func_to_decorate: the function whose inputs and outputs shall be converted`

			`Returns:`
			`the decorated function`

			`"""`
			`# converts all inputs to tensor if possible`
			`# we need to include tensors here, since otherwise they will also be treated as sequences`
			`func_convert_inputs = _apply_to_inputs(`
			`apply_to_collection, (torch.Tensor, np.ndarray, numbers.Number), _convert_to_tensor)(func_to_decorate)`
			`# convert all outputs to tensor if possible`
			`return _apply_to_outputs(_convert_to_tensor)(func_convert_inputs)`


			`def _sync_ddp_if_available(result: Union[torch.Tensor],`
			`group: Optional[Any] = None,`
			`reduce_op: Optional[torch.distributed.ReduceOp] = None,`
			`) -> torch.Tensor:`
			`"""`
			`Function to reduce the tensors from several ddp processes to one master process`

			`Args:`
			`result: the value to sync and reduce (typically tensor or number)`
			`group: the process group to gather results from. Defaults to all processes (world)`
			`reduce_op: the reduction operation. Defaults to sum.`

			`Returns:`
			`reduced value`

			`"""`

			`if torch.distributed.is_available() and torch.distributed.is_initialized():`
			`if group is None:`
			`group = torch.distributed.group.WORLD`

			`if reduce_op is None:`
			`reduce_op = torch.distributed.ReduceOp.SUM`

			`# sync all processes before reduction`
			`torch.distributed.barrier(group=group)`
			`torch.distributed.all_reduce(result, op=reduce_op, group=group,`
			`async_op=False)`

			`return result`


			`def numpy_metric(group: Optional[Any] = None,`
			`reduce_op: Optional[torch.distributed.ReduceOp] = None) -> Callable:`
			`"""`
			`This decorator shall be used on all function metrics working on numpy arrays.`

			`It handles the argument conversion and DDP reduction for metrics working on numpy.`
			`All inputs of the decorated function will be converted to numpy and all`
			`outputs will be converted to tensors.`
			`In DDP Training all output tensors will be reduced according to the given rules.`

			`Args:`
			`group: the process group to gather results from. Defaults to all processes (world)`
			`reduce_op: the reduction operation. Defaults to sum`

			`Returns:`
			`the decorated function`

			`"""`

			`def decorator_fn(func_to_decorate):`
			`return _apply_to_outputs(apply_to_collection, torch.Tensor, _sync_ddp_if_available,`
			`group=group,`
			`reduce_op=reduce_op)(_numpy_metric_conversion(func_to_decorate))`

			`return decorator_fn`


			`def tensor_metric(group: Optional[Any] = None,`
			`reduce_op: Optional[torch.distributed.ReduceOp] = None) -> Callable:`
			`"""`
			`This decorator shall be used on all function metrics working on tensors.`

			`It handles the argument conversion and DDP reduction for metrics working on tensors.`
			`All inputs and outputs of the decorated function will be converted to tensors.`
			`In DDP Training all output tensors will be reduced according to the given rules.`

			`Args:`
			`group: the process group to gather results from. Defaults to all processes (world)`
			`reduce_op: the reduction operation. Defaults to sum`

			`Returns:`
			`the decorated function`

			`"""`

			`def decorator_fn(func_to_decorate):`
			`return _apply_to_outputs(apply_to_collection, torch.Tensor, _sync_ddp_if_available,`
			`group=group,`
			`reduce_op=reduce_op)(_tensor_metric_conversion(func_to_decorate))`

			`return decorator_fn`