Source code for imgaug.augmenters.edges

"""
Augmenters that deal with edge detection.

List of augmenters:

    * :class:`Canny`

:class:`~imgaug.augmenters.convolutional.EdgeDetect` and
:class:`~imgaug.augmenters.convolutional.DirectedEdgeDetect` are currently
still in ``convolutional.py``.

"""
from __future__ import print_function, division, absolute_import

from abc import ABCMeta, abstractmethod

import numpy as np
import cv2
import six

import imgaug as ia
from imgaug.imgaug import _normalize_cv2_input_arr_
from . import meta
from . import blend
from .. import parameters as iap
from .. import dtypes as iadt


# TODO this should be placed in some other file than edges.py as it could be
#      re-used wherever a binary image is the result
[docs]@six.add_metaclass(ABCMeta)
class IBinaryImageColorizer(object):
    """Interface for classes that convert binary masks to color images."""

[docs]    @abstractmethod
    def colorize(self, image_binary, image_original, nth_image, random_state):
        """
        Convert a binary image to a colorized one.

        Parameters
        ----------
        image_binary : ndarray
            Boolean ``(H,W)`` image.

        image_original : ndarray
            Original ``(H,W,C)`` input image.

        nth_image : int
            Index of the image in the batch.

        random_state : imgaug.random.RNG
            Random state to use.

        Returns
        -------
        ndarray
            Colorized form of `image_binary`.

        """


# TODO see above, this should be moved to another file
[docs]class RandomColorsBinaryImageColorizer(IBinaryImageColorizer):
    """
    Colorizer using two randomly sampled foreground/background colors.

    Parameters
    ----------
    color_true : int or tuple of int or list of int or imgaug.parameters.StochasticParameter, optional
        Color of the foreground, i.e. all pixels in binary images that are
        ``True``. This parameter will be queried once per image to
        generate ``(3,)`` samples denoting the color. (Note that even for
        grayscale images three values will be sampled and converted to
        grayscale according to ``0.299*R + 0.587*G + 0.114*B``. This is the
        same equation that is also used by OpenCV.)

            * If an int, exactly that value will always be used, i.e. every
              color will be ``(v, v, v)`` for value ``v``.
            * If a tuple ``(a, b)``, three random values from the range
              ``a <= x <= b`` will be sampled per image.
            * If a list, then three random values will be sampled from that
              list per image.
            * If a StochasticParameter, three values will be sampled from the
              parameter per image.

    color_false : int or tuple of int or list of int or imgaug.parameters.StochasticParameter, optional
        Analogous to `color_true`, but denotes the color for all pixels that
        are ``False`` in the binary input image.

    """

    def __init__(self, color_true=(0, 255), color_false=(0, 255)):
        self.color_true = iap.handle_discrete_param(
            color_true,
            "color_true",
            value_range=(0, 255),
            tuple_to_uniform=True,
            list_to_choice=True,
            allow_floats=False)

        self.color_false = iap.handle_discrete_param(
            color_false,
            "color_false",
            value_range=(0, 255),
            tuple_to_uniform=True,
            list_to_choice=True,
            allow_floats=False)

    def _draw_samples(self, random_state):
        color_true = self.color_true.draw_samples((3,),
                                                  random_state=random_state)
        color_false = self.color_false.draw_samples((3,),
                                                    random_state=random_state)
        return color_true, color_false

[docs]    def colorize(self, image_binary, image_original, nth_image, random_state):
        assert image_binary.ndim == 2, (
            "Expected binary image to colorize to be 2-dimensional, "
            "got %d dimensions." % (image_binary.ndim,))
        assert image_binary.dtype.kind == "b", (
            "Expected binary image to colorize to be boolean, "
            "got dtype kind %s." % (image_binary.dtype.kind,))
        assert image_original.ndim == 3, (
            "Expected original image to be 3-dimensional, got %d "
            "dimensions." % (image_original.ndim,))
        assert image_original.shape[-1] in [1, 3, 4], (
            "Expected original image to have 1, 3 or 4 channels. "
            "Got %d channels." % (image_original.shape[-1],))
        assert image_original.dtype.name == "uint8", (
            "Expected original image to have dtype uint8, got dtype %s." % (
                image_original.dtype.name))

        color_true, color_false = self._draw_samples(random_state)

        nb_channels = min(image_original.shape[-1], 3)
        image_colorized = np.zeros(
            (image_original.shape[0], image_original.shape[1], nb_channels),
            dtype=image_original.dtype)

        if nb_channels == 1:
            # single channel input image, convert colors to grayscale
            image_colorized[image_binary] = (
                0.299*color_true[0]
                + 0.587*color_true[1]
                + 0.114*color_true[2])
            image_colorized[~image_binary] = (
                0.299*color_false[0]
                + 0.587*color_false[1]
                + 0.114*color_false[2])
        else:
            image_colorized[image_binary] = color_true
            image_colorized[~image_binary] = color_false

        # re-attach alpha channel if it was present in input image
        if image_original.shape[-1] == 4:
            image_colorized = np.dstack(
                [image_colorized, image_original[:, :, 3:4]])

        return image_colorized

    def __str__(self):
        return ("RandomColorsBinaryImageColorizer("
                "color_true=%s, color_false=%s)") % (
                    self.color_true, self.color_false)


[docs]class Canny(meta.Augmenter):
    """
    Apply a canny edge detector to input images.

    **Supported dtypes**:

        * ``uint8``: yes; fully tested
        * ``uint16``: no; not tested
        * ``uint32``: no; not tested
        * ``uint64``: no; not tested
        * ``int8``: no; not tested
        * ``int16``: no; not tested
        * ``int32``: no; not tested
        * ``int64``: no; not tested
        * ``float16``: no; not tested
        * ``float32``: no; not tested
        * ``float64``: no; not tested
        * ``float128``: no; not tested
        * ``bool``: no; not tested

    Parameters
    ----------
    alpha : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
        Blending factor to use in alpha blending.
        A value close to 1.0 means that only the edge image is visible.
        A value close to 0.0 means that only the original image is visible.
        A value close to 0.5 means that the images are merged according to
        `0.5*image + 0.5*edge_image`.
        If a sample from this parameter is 0, no action will be performed for
        the corresponding image.

            * If an int or float, exactly that value will be used.
            * If a tuple ``(a, b)``, a random value from the range
              ``a <= x <= b`` will be sampled per image.
            * If a list, then a random value will be sampled from that list
              per image.
            * If a StochasticParameter, a value will be sampled from the
              parameter per image.

    hysteresis_thresholds : number or tuple of number or list of number or imgaug.parameters.StochasticParameter or tuple of tuple of number or tuple of list of number or tuple of imgaug.parameters.StochasticParameter, optional
        Min and max values to use in hysteresis thresholding.
        (This parameter seems to have not very much effect on the results.)
        Either a single parameter or a tuple of two parameters.
        If a single parameter is provided, the sampling happens once for all
        images with `(N,2)` samples being requested from the parameter,
        where each first value denotes the hysteresis minimum and each second
        the maximum.
        If a tuple of two parameters is provided, one sampling of `(N,)` values
        is independently performed per parameter (first parameter: hysteresis
        minimum, second: hysteresis maximum).

            * If this is a single number, both min and max value will always be
              exactly that value.
            * If this is a tuple of numbers ``(a, b)``, two random values from
              the range ``a <= x <= b`` will be sampled per image.
            * If this is a list, two random values will be sampled from that
              list per image.
            * If this is a StochasticParameter, two random values will be
              sampled from that parameter per image.
            * If this is a tuple ``(min, max)`` with ``min`` and ``max``
              both *not* being numbers, they will be treated according to the
              rules above (i.e. may be a number, tuple, list or
              StochasticParameter). A single value will be sampled per image
              and parameter.

    sobel_kernel_size : int or tuple of int or list of int or imgaug.parameters.StochasticParameter, optional
        Kernel size of the sobel operator initially applied to each image.
        This corresponds to ``apertureSize`` in ``cv2.Canny()``.
        If a sample from this parameter is ``<=1``, no action will be performed
        for the corresponding image.
        The maximum for this parameter is ``7`` (inclusive). Higher values are
        not accepted by OpenCV.
        If an even value ``v`` is sampled, it is automatically changed to
        ``v-1``.

            * If this is a single integer, the kernel size always matches that
              value.
            * If this is a tuple of integers ``(a, b)``, a random discrete
              value will be sampled from the range ``a <= x <= b`` per image.
            * If this is a list, a random value will be sampled from that
              list per image.
            * If this is a StochasticParameter, a random value will be sampled
              from that parameter per image.

    colorizer : None or imgaug.augmenters.edges.IBinaryImageColorizer, optional
        A strategy to convert binary edge images to color images.
        If this is ``None``, an instance of ``RandomColorBinaryImageColorizer``
        is created, which means that each edge image is converted into an
        ``uint8`` image, where edge and non-edge pixels each have a different
        color that was uniformly randomly sampled from the space of all
        ``uint8`` colors.

    seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
        See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.

    name : None or str, optional
        See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.

    random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
        Old name for parameter `seed`.
        Its usage will not yet cause a deprecation warning,
        but it is still recommended to use `seed` now.
        Outdated since 0.4.0.

    deterministic : bool, optional
        Deprecated since 0.4.0.
        See method ``to_deterministic()`` for an alternative and for
        details about what the "deterministic mode" actually does.

    Examples
    --------
    >>> import imgaug.augmenters as iaa
    >>> aug = iaa.Canny()

    Create an augmenter that generates random blends between images and
    their canny edge representations.

    >>> aug = iaa.Canny(alpha=(0.0, 0.5))

    Create a canny edge augmenter that generates edge images with a blending
    factor of max ``50%``, i.e. the original (non-edge) image is always at
    least partially visible.

    >>> aug = iaa.Canny(
    >>>     alpha=(0.0, 0.5),
    >>>     colorizer=iaa.RandomColorsBinaryImageColorizer(
    >>>         color_true=255,
    >>>         color_false=0
    >>>     )
    >>> )

    Same as in the previous example, but the edge image always uses the
    color white for edges and black for the background.

    >>> aug = iaa.Canny(alpha=(0.5, 1.0), sobel_kernel_size=[3, 7])

    Create a canny edge augmenter that initially preprocesses images using
    a sobel filter with kernel size of either ``3x3`` or ``13x13`` and
    alpha-blends with result using a strength of ``50%`` (both images
    equally visible) to ``100%`` (only edge image visible).

    >>> aug = iaa.Alpha(
    >>>     (0.0, 1.0),
    >>>     iaa.Canny(alpha=1),
    >>>     iaa.MedianBlur(13)
    >>> )

    Create an augmenter that blends a canny edge image with a median-blurred
    version of the input image. The median blur uses a fixed kernel size
    of ``13x13`` pixels.

    """

    def __init__(self,
                 alpha=(0.0, 1.0),
                 hysteresis_thresholds=((100-40, 100+40), (200-40, 200+40)),
                 sobel_kernel_size=(3, 7),
                 colorizer=None,
                 seed=None, name=None,
                 random_state="deprecated", deterministic="deprecated"):
        super(Canny, self).__init__(
            seed=seed, name=name,
            random_state=random_state, deterministic=deterministic)

        self.alpha = iap.handle_continuous_param(
            alpha, "alpha", value_range=(0, 1.0), tuple_to_uniform=True,
            list_to_choice=True)

        if isinstance(hysteresis_thresholds, tuple) \
                and len(hysteresis_thresholds) == 2 \
                and not ia.is_single_number(hysteresis_thresholds[0]) \
                and not ia.is_single_number(hysteresis_thresholds[1]):
            self.hysteresis_thresholds = (
                iap.handle_discrete_param(
                    hysteresis_thresholds[0],
                    "hysteresis_thresholds[0]",
                    value_range=(0, 255),
                    tuple_to_uniform=True,
                    list_to_choice=True,
                    allow_floats=True),
                iap.handle_discrete_param(
                    hysteresis_thresholds[1],
                    "hysteresis_thresholds[1]",
                    value_range=(0, 255),
                    tuple_to_uniform=True,
                    list_to_choice=True,
                    allow_floats=True)
            )
        else:
            self.hysteresis_thresholds = iap.handle_discrete_param(
                hysteresis_thresholds,
                "hysteresis_thresholds",
                value_range=(0, 255),
                tuple_to_uniform=True,
                list_to_choice=True,
                allow_floats=True)

        # we don't use handle_discrete_kernel_size_param() here, because
        # cv2.Canny() can't handle independent height/width values, only a
        # single kernel size
        self.sobel_kernel_size = iap.handle_discrete_param(
            sobel_kernel_size,
            "sobel_kernel_size",
            value_range=(0, 7),  # OpenCV only accepts ksize up to 7
            tuple_to_uniform=True,
            list_to_choice=True,
            allow_floats=False)

        self.colorizer = (
            colorizer
            if colorizer is not None
            else RandomColorsBinaryImageColorizer()
        )

    def _draw_samples(self, augmentables, random_state):
        nb_images = len(augmentables)
        rss = random_state.duplicate(4)

        alpha_samples = self.alpha.draw_samples((nb_images,), rss[0])

        hthresh = self.hysteresis_thresholds
        if isinstance(hthresh, tuple):
            min_values = hthresh[0].draw_samples((nb_images,), rss[1])
            max_values = hthresh[1].draw_samples((nb_images,), rss[2])
            hthresh_samples = np.stack([min_values, max_values], axis=-1)
        else:
            hthresh_samples = hthresh.draw_samples((nb_images, 2), rss[1])

        sobel_samples = self.sobel_kernel_size.draw_samples((nb_images,),
                                                            rss[3])

        # verify for hysteresis thresholds that min_value < max_value everywhere
        invalid = (hthresh_samples[:, 0] > hthresh_samples[:, 1])
        if np.any(invalid):
            hthresh_samples[invalid, :] = hthresh_samples[invalid, :][:, [1, 0]]

        # ensure that sobel kernel sizes are correct
        # note that OpenCV accepts only kernel sizes that are (a) even
        # and (b) <=7
        assert not np.any(sobel_samples < 0), (
            "Sampled a sobel kernel size below 0 in Canny. "
            "Allowed value range is 0 to 7.")
        assert not np.any(sobel_samples > 7), (
            "Sampled a sobel kernel size above 7 in Canny. "
            "Allowed value range is 0 to 7.")
        even_idx = (np.mod(sobel_samples, 2) == 0)
        sobel_samples[even_idx] -= 1

        return alpha_samples, hthresh_samples, sobel_samples

    # Added in 0.4.0.
    def _augment_batch_(self, batch, random_state, parents, hooks):
        if batch.images is None:
            return batch

        images = batch.images

        iadt.gate_dtypes(images,
                         allowed=["uint8"],
                         disallowed=[
                             "bool",
                             "uint16", "uint32", "uint64", "uint128",
                             "uint256",
                             "int8", "int16", "int32", "int64", "int128",
                             "int256",
                             "float32", "float64", "float96", "float128",
                             "float256"],
                         augmenter=self)

        rss = random_state.duplicate(len(images))
        samples = self._draw_samples(images, rss[-1])
        alpha_samples = samples[0]
        hthresh_samples = samples[1]
        sobel_samples = samples[2]

        gen = enumerate(zip(images, alpha_samples, hthresh_samples,
                            sobel_samples))
        for i, (image, alpha, hthreshs, sobel) in gen:
            assert image.shape[-1] in [1, 3, 4], (
                "Canny edge detector can currently only handle images with "
                "channel numbers that are 1, 3 or 4. Got %d.") % (
                    image.shape[-1],)

            has_zero_sized_axes = (0 in image.shape[0:2])
            if alpha > 0 and sobel > 1 and not has_zero_sized_axes:
                image_canny = cv2.Canny(
                    _normalize_cv2_input_arr_(image[:, :, 0:3]),
                    threshold1=hthreshs[0],
                    threshold2=hthreshs[1],
                    apertureSize=sobel,
                    L2gradient=True)
                image_canny = (image_canny > 0)

                # canny returns a boolean (H,W) image, so we change it to
                # (H,W,C) and then uint8
                image_canny_color = self.colorizer.colorize(
                    image_canny, image, nth_image=i, random_state=rss[i])

                batch.images[i] = blend.blend_alpha(image_canny_color, image,
                                                    alpha)

        return batch

[docs]    def get_parameters(self):
        """See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
        return [self.alpha, self.hysteresis_thresholds, self.sobel_kernel_size,
                self.colorizer]

    def __str__(self):
        return ("Canny("
                "alpha=%s, "
                "hysteresis_thresholds=%s, "
                "sobel_kernel_size=%s, "
                "colorizer=%s, "
                "name=%s, "
                "deterministic=%s)" % (
                    self.alpha, self.hysteresis_thresholds,
                    self.sobel_kernel_size, self.colorizer,
                    self.name, self.deterministic))