"""
Augmenters that perform simple arithmetic changes.
List of augmenters:
* :class:`Add`
* :class:`AddElementwise`
* :class:`AdditiveGaussianNoise`
* :class:`AdditiveLaplaceNoise`
* :class:`AdditivePoissonNoise`
* :class:`Multiply`
* :class:`MultiplyElementwise`
* :class:`Cutout`
* :class:`Dropout`
* :class:`CoarseDropout`
* :class:`Dropout2d`
* :class:`TotalDropout`
* :class:`ReplaceElementwise`
* :class:`ImpulseNoise`
* :class:`SaltAndPepper`
* :class:`CoarseSaltAndPepper`
* :class:`Salt`
* :class:`CoarseSalt`
* :class:`Pepper`
* :class:`CoarsePepper`
* :class:`Invert`
* :class:`Solarize`
* :class:`ContrastNormalization`
* :class:`JpegCompression`
"""
from __future__ import print_function, division, absolute_import
import tempfile
import imageio
import numpy as np
import imgaug as ia
from . import meta
from .. import parameters as iap
from .. import dtypes as iadt
from .. import random as iarandom
# fill modes for apply_cutout_() and Cutout augmenter
# contains roughly:
# 'str fill_mode_name => (str module_name, str function_name)'
# We could also assign the function to each fill mode name instead of its
# name, but that has the disadvantage that these aren't defined yet (they
# are defined further below) and that during unittesting they would be harder
# to mock. (mock.patch() seems to not automatically replace functions
# assigned in that way.)
_CUTOUT_FILL_MODES = {
"constant": ("imgaug.augmenters.arithmetic", "_fill_rectangle_constant_"),
"gaussian": ("imgaug.augmenters.arithmetic", "_fill_rectangle_gaussian_")
}
[docs]def add_scalar(image, value):
"""Add a single scalar value or one scalar value per channel to an image.
This method ensures that ``uint8`` does not overflow during the addition.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: limited; tested (1)
* ``uint32``: no
* ``uint64``: no
* ``int8``: limited; tested (1)
* ``int16``: limited; tested (1)
* ``int32``: no
* ``int64``: no
* ``float16``: limited; tested (1)
* ``float32``: limited; tested (1)
* ``float64``: no
* ``float128``: no
* ``bool``: limited; tested (1)
- (1) Non-uint8 dtypes can overflow. For floats, this can result
in +/-inf.
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
If `value` contains more than one value, the shape of the image is
expected to be ``(H,W,C)``.
value : number or ndarray
The value to add to the image. Either a single value or an array
containing exactly one component per channel, i.e. ``C`` components.
Returns
-------
ndarray
Image with value added to it.
"""
if image.size == 0:
return np.copy(image)
iadt.gate_dtypes(
image,
allowed=["bool",
"uint8", "uint16",
"int8", "int16",
"float16", "float32"],
disallowed=["uint32", "uint64", "uint128", "uint256",
"int32", "int64", "int128", "int256",
"float64", "float96", "float128",
"float256"],
augmenter=None)
if image.dtype.name == "uint8":
return _add_scalar_to_uint8(image, value)
return _add_scalar_to_non_uint8(image, value)
def _add_scalar_to_uint8(image, value):
# Using this LUT approach is significantly faster than using
# numpy-based adding with dtype checks (around 3-4x speedup) and is
# still faster than the simple numpy image+sample approach without LUT
# (about 10% at 64x64 and about 2x at 224x224 -- maybe dependent on
# installed BLAS libraries?)
# pylint: disable=no-else-return
is_single_value = (
ia.is_single_number(value)
or ia.is_np_scalar(value)
or (ia.is_np_array(value) and value.size == 1))
is_channelwise = not is_single_value
nb_channels = 1 if image.ndim == 2 else image.shape[-1]
value = np.clip(np.round(value), -255, 255).astype(np.int16)
value_range = np.arange(0, 256, dtype=np.int16)
if is_channelwise:
assert value.ndim == 1, (
"Expected `value` to be 1-dimensional, got %d-dimensional "
"data with shape %s." % (value.ndim, value.shape))
assert image.ndim == 3, (
"Expected `image` to be 3-dimensional when adding one value per "
"channel, got %d-dimensional data with shape %s." % (
image.ndim, image.shape))
assert image.shape[-1] == value.size, (
"Expected number of channels in `image` and number of components "
"in `value` to be identical. Got %d vs. %d." % (
image.shape[-1], value.size))
# TODO check if tile() is here actually needed
tables = np.tile(
value_range[:, np.newaxis],
(1, nb_channels)
) + value[np.newaxis, :]
else:
tables = value_range + value
tables = np.clip(tables, 0, 255).astype(image.dtype)
return ia.apply_lut(image, tables)
def _add_scalar_to_non_uint8(image, value):
input_dtype = image.dtype
is_single_value = (
ia.is_single_number(value)
or ia.is_np_scalar(value)
or (ia.is_np_array(value) and value.size == 1))
is_channelwise = not is_single_value
nb_channels = 1 if image.ndim == 2 else image.shape[-1]
shape = (1, 1, nb_channels if is_channelwise else 1)
value = np.array(value).reshape(shape)
# We limit here the value range of the value parameter to the
# bytes in the image's dtype. This prevents overflow problems
# and makes it less likely that the image has to be up-casted,
# which again improves performance and saves memory. Note that
# this also enables more dtypes for image inputs.
# The downside is that the mul parameter is limited in its
# value range.
#
# We need 2* the itemsize of the image here to allow to shift
# the image's max value to the lowest possible value, e.g. for
# uint8 it must allow for -255 to 255.
itemsize = image.dtype.itemsize * 2
dtype_target = np.dtype("%s%d" % (value.dtype.kind, itemsize))
value = iadt.clip_to_dtype_value_range_(
value, dtype_target, validate=True)
# Itemsize is currently reduced from 2 to 1 due to clip no
# longer supporting int64, which can cause issues with int32
# samples (32*2 = 64bit).
# TODO limit value ranges of samples to int16/uint16 for
# security
image, value = iadt.promote_array_dtypes_(
[image, value],
dtypes=[image.dtype, dtype_target],
increase_itemsize_factor=1)
image = np.add(image, value, out=image, casting="no")
return iadt.restore_dtypes_(image, input_dtype)
[docs]def add_elementwise(image, values):
"""Add an array of values to an image.
This method ensures that ``uint8`` does not overflow during the addition.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: limited; tested (1)
* ``uint32``: no
* ``uint64``: no
* ``int8``: limited; tested (1)
* ``int16``: limited; tested (1)
* ``int32``: no
* ``int64``: no
* ``float16``: limited; tested (1)
* ``float32``: limited; tested (1)
* ``float64``: no
* ``float128``: no
* ``bool``: limited; tested (1)
- (1) Non-uint8 dtypes can overflow. For floats, this can result
in +/-inf.
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
values : ndarray
The values to add to the image. Expected to have the same height
and width as `image` and either no channels or one channel or
the same number of channels as `image`.
Returns
-------
ndarray
Image with values added to it.
"""
iadt.gate_dtypes(
image,
allowed=["bool",
"uint8", "uint16",
"int8", "int16",
"float16", "float32"],
disallowed=["uint32", "uint64", "uint128", "uint256",
"int32", "int64", "int128", "int256",
"float64", "float96", "float128",
"float256"],
augmenter=None)
if image.dtype.name == "uint8":
return _add_elementwise_to_uint8(image, values)
return _add_elementwise_to_non_uint8(image, values)
def _add_elementwise_to_uint8(image, values):
# This special uint8 block is around 60-100% faster than the
# corresponding non-uint8 function further below (more speedup
# for smaller images).
#
# Also tested to instead compute min/max of image and value
# and then only convert image/value dtype if actually
# necessary, but that was like 20-30% slower, even for 224x224
# images.
#
if values.dtype.kind == "f":
values = np.round(values)
image = image.astype(np.int16)
values = np.clip(values, -255, 255).astype(np.int16)
image_aug = image + values
image_aug = np.clip(image_aug, 0, 255).astype(np.uint8)
return image_aug
def _add_elementwise_to_non_uint8(image, values):
# We limit here the value range of the value parameter to the
# bytes in the image's dtype. This prevents overflow problems
# and makes it less likely that the image has to be up-casted,
# which again improves performance and saves memory. Note that
# this also enables more dtypes for image inputs.
# The downside is that the mul parameter is limited in its
# value range.
#
# We need 2* the itemsize of the image here to allow to shift
# the image's max value to the lowest possible value, e.g. for
# uint8 it must allow for -255 to 255.
input_shape = image.shape
input_dtype = image.dtype
if image.ndim == 2:
image = image[..., np.newaxis]
if values.ndim == 2:
values = values[..., np.newaxis]
nb_channels = image.shape[-1]
itemsize = image.dtype.itemsize * 2
dtype_target = np.dtype("%s%d" % (values.dtype.kind, itemsize))
values = iadt.clip_to_dtype_value_range_(values, dtype_target,
validate=100)
if values.shape[2] == 1:
values = np.tile(values, (1, 1, nb_channels))
# Decreased itemsize from 2 to 1 here, see explanation in Add.
image, values = iadt.promote_array_dtypes_(
[image, values],
dtypes=[image.dtype, dtype_target],
increase_itemsize_factor=1)
image = np.add(image, values, out=image, casting="no")
image = iadt.restore_dtypes_(image, input_dtype)
if len(input_shape) == 2:
return image[..., 0]
return image
[docs]def multiply_scalar(image, multiplier):
"""Multiply an image by a single scalar or one scalar per channel.
This method ensures that ``uint8`` does not overflow during the
multiplication.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: limited; tested (1)
* ``uint32``: no
* ``uint64``: no
* ``int8``: limited; tested (1)
* ``int16``: limited; tested (1)
* ``int32``: no
* ``int64``: no
* ``float16``: limited; tested (1)
* ``float32``: limited; tested (1)
* ``float64``: no
* ``float128``: no
* ``bool``: limited; tested (1)
- (1) Non-uint8 dtypes can overflow. For floats, this can result in
+/-inf.
note::
Tests were only conducted for rather small multipliers, around
``-10.0`` to ``+10.0``.
In general, the multipliers sampled from `multiplier` must be in a
value range that corresponds to the input image's dtype. E.g. if the
input image has dtype ``uint16`` and the samples generated from
`multiplier` are ``float64``, this function will still force all
samples to be within the value range of ``float16``, as it has the
same number of bytes (two) as ``uint16``. This is done to make
overflows less likely to occur.
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
If `value` contains more than one value, the shape of the image is
expected to be ``(H,W,C)``.
multiplier : number or ndarray
The multiplier to use. Either a single value or an array
containing exactly one component per channel, i.e. ``C`` components.
Returns
-------
ndarray
Image, multiplied by `multiplier`.
"""
if image.size == 0:
return np.copy(image)
iadt.gate_dtypes(
image,
allowed=["bool",
"uint8", "uint16",
"int8", "int16",
"float16", "float32"],
disallowed=["uint32", "uint64", "uint128", "uint256",
"int32", "int64", "int128", "int256",
"float64", "float96", "float128",
"float256"],
augmenter=None)
if image.dtype.name == "uint8":
return _multiply_scalar_to_uint8(image, multiplier)
return _multiply_scalar_to_non_uint8(image, multiplier)
def _multiply_scalar_to_uint8(image, multiplier):
# Using this LUT approach is significantly faster than
# else-block code (more than 10x speedup) and is still faster
# than the simpler image*sample approach without LUT (1.5-3x
# speedup, maybe dependent on installed BLAS libraries?)
# pylint: disable=no-else-return
is_single_value = (
ia.is_single_number(multiplier)
or ia.is_np_scalar(multiplier)
or (ia.is_np_array(multiplier) and multiplier.size == 1))
is_channelwise = not is_single_value
nb_channels = 1 if image.ndim == 2 else image.shape[-1]
multiplier = np.float32(multiplier)
value_range = np.arange(0, 256, dtype=np.float32)
if is_channelwise:
assert multiplier.ndim == 1, (
"Expected `multiplier` to be 1-dimensional, got %d-dimensional "
"data with shape %s." % (multiplier.ndim, multiplier.shape))
assert image.ndim == 3, (
"Expected `image` to be 3-dimensional when multiplying by one "
"value per channel, got %d-dimensional data with shape %s." % (
image.ndim, image.shape))
assert image.shape[-1] == multiplier.size, (
"Expected number of channels in `image` and number of components "
"in `multiplier` to be identical. Got %d vs. %d." % (
image.shape[-1], multiplier.size))
# TODO check if tile() is here actually needed
tables = np.tile(
value_range[:, np.newaxis],
(1, nb_channels)
) * multiplier[np.newaxis, :]
else:
tables = value_range * multiplier
tables = np.clip(tables, 0, 255).astype(image.dtype)
return ia.apply_lut(image, tables)
def _multiply_scalar_to_non_uint8(image, multiplier):
# TODO estimate via image min/max values whether a resolution
# increase is necessary
input_dtype = image.dtype
is_single_value = (
ia.is_single_number(multiplier)
or ia.is_np_scalar(multiplier)
or (ia.is_np_array(multiplier) and multiplier.size == 1))
is_channelwise = not is_single_value
nb_channels = 1 if image.ndim == 2 else image.shape[-1]
shape = (1, 1, nb_channels if is_channelwise else 1)
multiplier = np.array(multiplier).reshape(shape)
# deactivated itemsize increase due to clip causing problems
# with int64, see Add
# mul_min = np.min(mul)
# mul_max = np.max(mul)
# is_not_increasing_value_range = (
# (-1 <= mul_min <= 1)
# and (-1 <= mul_max <= 1))
# We limit here the value range of the mul parameter to the
# bytes in the image's dtype. This prevents overflow problems
# and makes it less likely that the image has to be up-casted,
# which again improves performance and saves memory. Note that
# this also enables more dtypes for image inputs.
# The downside is that the mul parameter is limited in its
# value range.
itemsize = max(
image.dtype.itemsize,
2 if multiplier.dtype.kind == "f" else 1
) # float min itemsize is 2 not 1
dtype_target = np.dtype("%s%d" % (multiplier.dtype.kind, itemsize))
multiplier = iadt.clip_to_dtype_value_range_(
multiplier, dtype_target, validate=True)
image, multiplier = iadt.promote_array_dtypes_(
[image, multiplier],
dtypes=[image.dtype, dtype_target],
# increase_itemsize_factor=(
# 1 if is_not_increasing_value_range else 2)
increase_itemsize_factor=1
)
image = np.multiply(image, multiplier, out=image, casting="no")
return iadt.restore_dtypes_(image, input_dtype)
[docs]def multiply_elementwise(image, multipliers):
"""Multiply an image with an array of values.
This method ensures that ``uint8`` does not overflow during the addition.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: limited; tested (1)
* ``uint32``: no
* ``uint64``: no
* ``int8``: limited; tested (1)
* ``int16``: limited; tested (1)
* ``int32``: no
* ``int64``: no
* ``float16``: limited; tested (1)
* ``float32``: limited; tested (1)
* ``float64``: no
* ``float128``: no
* ``bool``: limited; tested (1)
- (1) Non-uint8 dtypes can overflow. For floats, this can result
in +/-inf.
note::
Tests were only conducted for rather small multipliers, around
``-10.0`` to ``+10.0``.
In general, the multipliers sampled from `multipliers` must be in a
value range that corresponds to the input image's dtype. E.g. if the
input image has dtype ``uint16`` and the samples generated from
`multipliers` are ``float64``, this function will still force all
samples to be within the value range of ``float16``, as it has the
same number of bytes (two) as ``uint16``. This is done to make
overflows less likely to occur.
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
multipliers : ndarray
The multipliers with which to multiply the image. Expected to have
the same height and width as `image` and either no channels or one
channel or the same number of channels as `image`.
Returns
-------
ndarray
Image, multiplied by `multipliers`.
"""
iadt.gate_dtypes(
image,
allowed=["bool",
"uint8", "uint16",
"int8", "int16",
"float16", "float32"],
disallowed=["uint32", "uint64", "uint128", "uint256",
"int32", "int64", "int128", "int256",
"float64", "float96", "float128", "float256"],
augmenter=None)
if multipliers.dtype.kind == "b":
# TODO extend this with some shape checks
image *= multipliers
return image
if image.dtype.name == "uint8":
return _multiply_elementwise_to_uint8(image, multipliers)
return _multiply_elementwise_to_non_uint8(image, multipliers)
def _multiply_elementwise_to_uint8(image, multipliers):
# This special uint8 block is around 60-100% faster than the
# non-uint8 block further below (more speedup for larger images).
if multipliers.dtype.kind == "f":
# interestingly, float32 is here significantly faster than
# float16
# TODO is that system dependent?
# TODO does that affect int8-int32 too?
multipliers = multipliers.astype(np.float32, copy=False)
image_aug = image.astype(np.float32)
else:
multipliers = multipliers.astype(np.int16, copy=False)
image_aug = image.astype(np.int16)
image_aug = np.multiply(image_aug, multipliers, casting="no", out=image_aug)
return iadt.restore_dtypes_(image_aug, np.uint8, round=False)
def _multiply_elementwise_to_non_uint8(image, multipliers):
input_dtype = image.dtype
# TODO maybe introduce to stochastic parameters some way to
# get the possible min/max values, could make things
# faster for dropout to get 0/1 min/max from the binomial
# itemsize decrease is currently deactivated due to issues
# with clip and int64, see Add
mul_min = np.min(multipliers)
mul_max = np.max(multipliers)
# is_not_increasing_value_range = (
# (-1 <= mul_min <= 1) and (-1 <= mul_max <= 1))
# We limit here the value range of the mul parameter to the
# bytes in the image's dtype. This prevents overflow problems
# and makes it less likely that the image has to be up-casted,
# which again improves performance and saves memory. Note that
# this also enables more dtypes for image inputs.
# The downside is that the mul parameter is limited in its
# value range.
itemsize = max(
image.dtype.itemsize,
2 if multipliers.dtype.kind == "f" else 1
) # float min itemsize is 2
dtype_target = np.dtype("%s%d" % (multipliers.dtype.kind, itemsize))
multipliers = iadt.clip_to_dtype_value_range_(
multipliers, dtype_target,
validate=True, validate_values=(mul_min, mul_max))
if multipliers.shape[2] == 1:
# TODO check if tile() is here actually needed
nb_channels = image.shape[-1]
multipliers = np.tile(multipliers, (1, 1, nb_channels))
image, multipliers = iadt.promote_array_dtypes_(
[image, multipliers],
dtypes=[image, dtype_target],
increase_itemsize_factor=1
# increase_itemsize_factor=(
# 1 if is_not_increasing_value_range else 2)
)
image = np.multiply(image, multipliers, out=image, casting="no")
return iadt.restore_dtypes_(image, input_dtype)
[docs]def cutout(image, x1, y1, x2, y2,
fill_mode="constant", cval=0, fill_per_channel=False,
seed=None):
"""Fill a single area within an image using a fill mode.
This cutout method uses the top-left and bottom-right corner coordinates
of the cutout region given as absolute pixel values.
.. note::
Gaussian fill mode will assume that float input images contain values
in the interval ``[0.0, 1.0]`` and hence sample values from a
gaussian within that interval, i.e. from ``N(0.5, std=0.5/3)``.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
Added in 0.4.0.
Parameters
----------
image : ndarray
Image to modify.
x1 : number
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
y1 : number
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
x2 : number
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
y2 : number
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
fill_mode : {'constant', 'gaussian'}, optional
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
cval : number or tuple of number, optional
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
fill_per_channel : number or bool, optional
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
Returns
-------
ndarray
Image with area filled in.
"""
return cutout_(np.copy(image),
x1, y1, x2, y2,
fill_mode, cval, fill_per_channel, seed)
[docs]def cutout_(image, x1, y1, x2, y2,
fill_mode="constant", cval=0, fill_per_channel=False,
seed=None):
"""Fill a single area within an image using a fill mode (in-place).
This cutout method uses the top-left and bottom-right corner coordinates
of the cutout region given as absolute pixel values.
.. note::
Gaussian fill mode will assume that float input images contain values
in the interval ``[0.0, 1.0]`` and hence sample values from a
gaussian within that interval, i.e. from ``N(0.5, std=0.5/3)``.
Added in 0.4.0.
**Supported dtypes**:
minimum of (
:func:`~imgaug.augmenters.arithmetic._fill_rectangle_gaussian_`,
:func:`~imgaug.augmenters.arithmetic._fill_rectangle_constant_`
)
Parameters
----------
image : ndarray
Image to modify. Might be modified in-place.
x1 : number
X-coordinate of the top-left corner of the cutout region.
y1 : number
Y-coordinate of the top-left corner of the cutout region.
x2 : number
X-coordinate of the bottom-right corner of the cutout region.
y2 : number
Y-coordinate of the bottom-right corner of the cutout region.
fill_mode : {'constant', 'gaussian'}, optional
Fill mode to use.
cval : number or tuple of number, optional
The constant value to use when filling with mode ``constant``.
May be an intensity value or color tuple.
fill_per_channel : number or bool, optional
Whether to fill in a channelwise fashion.
If number then a value ``>=0.5`` will be interpreted as ``True``.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
A random number generator to sample random values from.
Usually an integer seed value or an ``RNG`` instance.
See :class:`imgaug.random.RNG` for details.
Returns
-------
ndarray
Image with area filled in.
The input image might have been modified in-place.
"""
import importlib
height, width = image.shape[0:2]
x1 = min(max(int(x1), 0), width)
y1 = min(max(int(y1), 0), height)
x2 = min(max(int(x2), 0), width)
y2 = min(max(int(y2), 0), height)
if x2 > x1 and y2 > y1:
assert fill_mode in _CUTOUT_FILL_MODES, (
"Expected one of the following fill modes: %s. "
"Got: %s." % (
str(list(_CUTOUT_FILL_MODES.keys())), fill_mode))
module_name, fname = _CUTOUT_FILL_MODES[fill_mode]
module = importlib.import_module(module_name)
func = getattr(module, fname)
image = func(
image,
x1=x1, y1=y1, x2=x2, y2=y2,
cval=cval,
per_channel=(fill_per_channel >= 0.5),
random_state=(
iarandom.RNG(seed)
if not isinstance(seed, iarandom.RNG)
else seed) # only RNG(.) without "if" is ~8x slower
)
return image
def _fill_rectangle_gaussian_(image, x1, y1, x2, y2, cval, per_channel,
random_state):
"""Fill a rectangular image area with samples from a gaussian.
Added in 0.4.0.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: limited; tested (1)
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: limited; tested (1)
* ``float16``: yes; tested (2)
* ``float32``: yes; tested (2)
* ``float64``: yes; tested (2)
* ``float128``: limited; tested (1) (2)
* ``bool``: yes; tested
- (1) Possible loss of resolution due to gaussian values being sampled
as ``float64`` s.
- (2) Float input arrays are assumed to be in interval ``[0.0, 1.0]``
and all gaussian samples are within that interval too.
"""
# for float we assume value range [0.0, 1.0]
# that matches the common use case and also makes the tests way easier
# we also set bool here manually as the center value returned by
# get_value_range_for_dtype() is None
kind = image.dtype.kind
if kind in ["f", "b"]:
min_value = 0.0
center_value = 0.5
max_value = 1.0
else:
min_value, center_value, max_value = iadt.get_value_range_of_dtype(
image.dtype)
# set standard deviation to 1/3 of value range to get 99.7% of values
# within [min v.r., max v.r.]
# we also divide by 2 because we want to spread towards the
# "left"/"right" of the center value by half of the value range
stddev = (float(max_value) - float(min_value)) / 2.0 / 3.0
height = y2 - y1
width = x2 - x1
shape = (height, width)
if per_channel and image.ndim == 3:
shape = shape + (image.shape[2],)
rect = random_state.normal(center_value, stddev, size=shape)
if image.dtype.kind == "b":
rect_vr = (rect > 0.5)
else:
rect_vr = np.clip(rect, min_value, max_value).astype(image.dtype)
if image.ndim == 3:
image[y1:y2, x1:x2, :] = np.atleast_3d(rect_vr)
else:
image[y1:y2, x1:x2] = rect_vr
return image
def _fill_rectangle_constant_(image, x1, y1, x2, y2, cval, per_channel,
random_state):
"""Fill a rectangular area within an image with constant value(s).
`cval` may be a single value or one per channel. If the number of items
in `cval` does not match the number of channels in `image`, it may
be tiled up to the number of channels.
Added in 0.4.0.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: yes; tested
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: yes; tested
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: yes; tested
* ``float128``: yes; tested
* ``bool``: yes; tested
"""
if ia.is_iterable(cval):
if per_channel:
nb_channels = None if image.ndim == 2 else image.shape[-1]
if nb_channels is None:
cval = cval[0]
elif len(cval) < nb_channels:
mul = int(np.ceil(nb_channels / len(cval)))
cval = np.tile(cval, (mul,))[0:nb_channels]
elif len(cval) > nb_channels:
cval = cval[0:nb_channels]
else:
cval = cval[0]
# without the array(), uint64 max value is assigned as 0
image[y1:y2, x1:x2, ...] = np.array(cval, dtype=image.dtype)
return image
[docs]def replace_elementwise_(image, mask, replacements):
"""Replace components in an image array with new values.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: no (1)
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: no (2)
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: yes; tested
* ``float128``: no
* ``bool``: yes; tested
- (1) ``uint64`` is currently not supported, because
:func:`~imgaug.dtypes.clip_to_dtype_value_range_()` does not
support it, which again is because numpy.clip() seems to not
support it.
- (2) `int64` is disallowed due to being converted to `float64`
by :func:`numpy.clip` since 1.17 (possibly also before?).
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
mask : ndarray
Mask of shape ``(H,W,[C])`` denoting which components to replace.
If ``C`` is provided, it must be ``1`` or match the ``C`` of `image`.
May contain floats in the interval ``[0.0, 1.0]``.
replacements : iterable
Replacements to place in `image` at the locations defined by `mask`.
This 1-dimensional iterable must contain exactly as many values
as there are replaced components in `image`.
Returns
-------
ndarray
Image with replaced components.
"""
iadt.gate_dtypes(
image,
allowed=["bool",
"uint8", "uint16", "uint32",
"int8", "int16", "int32",
"float16", "float32", "float64"],
disallowed=["uint64", "uint128", "uint256",
"int64", "int128", "int256",
"float96", "float128", "float256"],
augmenter=None)
# This is slightly faster (~20%) for masks that are True at many
# locations, but slower (~50%) for masks with few Trues, which is
# probably the more common use-case:
#
# replacement_samples = self.replacement.draw_samples(
# sampling_shape, random_state=rs_replacement)
#
# # round, this makes 0.2 e.g. become 0 in case of boolean
# # image (otherwise replacing values with 0.2 would
# # lead to True instead of False).
# if (image.dtype.kind in ["i", "u", "b"]
# and replacement_samples.dtype.kind == "f"):
# replacement_samples = np.round(replacement_samples)
#
# replacement_samples = iadt.clip_to_dtype_value_range_(
# replacement_samples, image.dtype, validate=False)
# replacement_samples = replacement_samples.astype(
# image.dtype, copy=False)
#
# if sampling_shape[2] == 1:
# mask_samples = np.tile(mask_samples, (1, 1, nb_channels))
# replacement_samples = np.tile(
# replacement_samples, (1, 1, nb_channels))
# mask_thresh = mask_samples > 0.5
# image[mask_thresh] = replacement_samples[mask_thresh]
input_shape = image.shape
if image.ndim == 2:
image = image[..., np.newaxis]
if mask.ndim == 2:
mask = mask[..., np.newaxis]
mask_thresh = mask > 0.5
if mask.shape[2] == 1:
nb_channels = image.shape[-1]
# TODO verify if tile() is here really necessary
mask_thresh = np.tile(mask_thresh, (1, 1, nb_channels))
# round, this makes 0.2 e.g. become 0 in case of boolean
# image (otherwise replacing values with 0.2 would lead to True
# instead of False).
if image.dtype.kind in ["i", "u", "b"] and replacements.dtype.kind == "f":
replacements = np.round(replacements)
replacement_samples = iadt.clip_to_dtype_value_range_(
replacements, image.dtype, validate=False)
replacement_samples = replacement_samples.astype(image.dtype, copy=False)
image[mask_thresh] = replacement_samples
if len(input_shape) == 2:
return image[..., 0]
return image
[docs]def invert(image, min_value=None, max_value=None, threshold=None,
invert_above_threshold=True):
"""Invert an array.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.invert_`.
Parameters
----------
image : ndarray
See :func:`invert_`.
min_value : None or number, optional
See :func:`invert_`.
max_value : None or number, optional
See :func:`invert_`.
threshold : None or number, optional
See :func:`invert_`.
invert_above_threshold : bool, optional
See :func:`invert_`.
Returns
-------
ndarray
Inverted image.
"""
return invert_(np.copy(image), min_value=min_value, max_value=max_value,
threshold=threshold,
invert_above_threshold=invert_above_threshold)
[docs]def invert_(image, min_value=None, max_value=None, threshold=None,
invert_above_threshold=True):
"""Invert an array in-place.
Added in 0.4.0.
**Supported dtypes**:
if (min_value=None and max_value=None):
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: yes; tested
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: yes; tested
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: yes; tested
* ``float128``: yes; tested
* ``bool``: yes; tested
if (min_value!=None or max_value!=None):
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: no (1)
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: no (2)
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: no (2)
* ``float128``: no (3)
* ``bool``: no (4)
- (1) Not allowed due to numpy's clip converting from ``uint64`` to
``float64``.
- (2) Not allowed as int/float have to be increased in resolution
when using min/max values.
- (3) Not tested.
- (4) Makes no sense when using min/max values.
Parameters
----------
image : ndarray
Image array of shape ``(H,W,[C])``.
The array *might* be modified in-place.
min_value : None or number, optional
Minimum of the value range of input images, e.g. ``0`` for ``uint8``
images. If set to ``None``, the value will be automatically derived
from the image's dtype.
max_value : None or number, optional
Maximum of the value range of input images, e.g. ``255`` for ``uint8``
images. If set to ``None``, the value will be automatically derived
from the image's dtype.
threshold : None or number, optional
A threshold to use in order to invert only numbers above or below
the threshold. If ``None`` no thresholding will be used.
invert_above_threshold : bool, optional
If ``True``, only values ``>=threshold`` will be inverted.
Otherwise, only values ``<threshold`` will be inverted.
If `threshold` is ``None`` this parameter has no effect.
Returns
-------
ndarray
Inverted image. This *can* be the same array as input in `image`,
modified in-place.
"""
# when no custom min/max are chosen, all bool, uint, int and float dtypes
# should be invertable (float tested only up to 64bit)
# when chosing custom min/max:
# - bool makes no sense, not allowed
# - int and float must be increased in resolution if custom min/max values
# are chosen, hence they are limited to 32 bit and below
# - uint64 is converted by numpy's clip to float64, hence loss of accuracy
# - float16 seems to not be perfectly accurate, but still ok-ish -- was
# off by 10 for center value of range (float 16 min, 16), where float
# 16 min is around -65500
allow_dtypes_custom_minmax = {"uint8", "uint16", "uint32",
"int8", "int16", "int32",
"float16", "float32"}
min_value_dt, _, max_value_dt = \
iadt.get_value_range_of_dtype(image.dtype)
min_value = (min_value_dt
if min_value is None else min_value)
max_value = (max_value_dt
if max_value is None else max_value)
assert min_value >= min_value_dt, (
"Expected min_value to be above or equal to dtype's min "
"value, got %s (vs. min possible %s for %s)" % (
str(min_value), str(min_value_dt), image.dtype.name)
)
assert max_value <= max_value_dt, (
"Expected max_value to be below or equal to dtype's max "
"value, got %s (vs. max possible %s for %s)" % (
str(max_value), str(max_value_dt), image.dtype.name)
)
assert min_value < max_value, (
"Expected min_value to be below max_value, got %s "
"and %s" % (
str(min_value), str(max_value))
)
if min_value != min_value_dt or max_value != max_value_dt:
assert image.dtype.name in allow_dtypes_custom_minmax, (
"Can use custom min/max values only with the following "
"dtypes: %s. Got: %s." % (
", ".join(allow_dtypes_custom_minmax), image.dtype.name))
if image.dtype.name == "uint8":
return _invert_uint8_(image, min_value, max_value, threshold,
invert_above_threshold)
dtype_kind_to_invert_func = {
"b": _invert_bool,
"u": _invert_uint16_or_larger_, # uint8 handled above
"i": _invert_int_,
"f": _invert_float
}
func = dtype_kind_to_invert_func[image.dtype.kind]
if threshold is None:
return func(image, min_value, max_value)
arr_inv = func(np.copy(image), min_value, max_value)
if invert_above_threshold:
mask = (image >= threshold)
else:
mask = (image < threshold)
image[mask] = arr_inv[mask]
return image
def _invert_bool(arr, min_value, max_value):
assert min_value == 0 and max_value == 1, (
"min_value and max_value must be 0 and 1 for bool arrays. "
"Got %.4f and %.4f." % (min_value, max_value))
return ~arr
# Added in 0.4.0.
def _invert_uint8_(arr, min_value, max_value, threshold,
invert_above_threshold):
table = _generate_table_for_invert_uint8(
min_value, max_value, threshold, invert_above_threshold)
arr = ia.apply_lut_(arr, table)
return arr
# Added in 0.4.0.
def _invert_uint16_or_larger_(arr, min_value, max_value):
min_max_is_vr = (min_value == 0
and max_value == np.iinfo(arr.dtype).max)
if min_max_is_vr:
return max_value - arr
return _invert_by_distance(
np.clip(arr, min_value, max_value),
min_value, max_value
)
# Added in 0.4.0.
def _invert_int_(arr, min_value, max_value):
# note that for int dtypes the max value is
# (-1) * min_value - 1
# e.g. -128 and 127 (min/max) for int8
# mapping example:
# [-4, -3, -2, -1, 0, 1, 2, 3]
# will be mapped to
# [ 3, 2, 1, 0, -1, -2, -3, -4]
# hence we can not simply compute the inverse as:
# after = (-1) * before
# but instead need
# after = (-1) * before - 1
# however, this exceeds the value range for the minimum value, e.g.
# for int8: -128 -> 128 -> 127, where 128 exceeds it. Hence, we must
# compute the inverse via a mask (extra step for the minimum)
# or we have to increase the resolution of the array. Here, a
# two-step approach is used.
if min_value == (-1) * max_value - 1:
arr_inv = np.copy(arr)
mask = (arr_inv == min_value)
# there is probably a one-liner here to do this, but
# ((-1) * (arr_inv * ~mask) - 1) + mask * max_value
# has the disadvantage of inverting min_value to max_value - 1
# while
# ((-1) * (arr_inv * ~mask) - 1) + mask * (max_value+1)
# ((-1) * (arr_inv * ~mask) - 1) + mask * max_value + mask
# both sometimes increase the dtype resolution (e.g. int32 to int64)
arr_inv[mask] = max_value
arr_inv[~mask] = (-1) * arr_inv[~mask] - 1
return arr_inv
return _invert_by_distance(
np.clip(arr, min_value, max_value),
min_value, max_value
)
def _invert_float(arr, min_value, max_value):
if np.isclose(max_value, (-1)*min_value, rtol=0):
return (-1) * arr
return _invert_by_distance(
np.clip(arr, min_value, max_value),
min_value, max_value
)
def _invert_by_distance(arr, min_value, max_value):
arr_inv = arr
if arr.dtype.kind in ["i", "f"]:
arr_inv = iadt.increase_array_resolutions_([np.copy(arr)], 2)[0]
distance_from_min = np.abs(arr_inv - min_value) # d=abs(v-min)
arr_inv = max_value - distance_from_min # v'=MAX-d
# due to floating point inaccuracies, we might exceed the min/max
# values for floats here, hence clip this happens especially for
# values close to the float dtype's maxima
if arr.dtype.kind == "f":
arr_inv = np.clip(arr_inv, min_value, max_value)
if arr.dtype.kind in ["i", "f"]:
arr_inv = iadt.restore_dtypes_(
arr_inv, arr.dtype, clip=False)
return arr_inv
# Added in 0.4.0.
def _generate_table_for_invert_uint8(min_value, max_value, threshold,
invert_above_threshold):
table = np.arange(256).astype(np.int32)
full_value_range = (min_value == 0 and max_value == 255)
if full_value_range:
table_inv = table[::-1]
else:
distance_from_min = np.abs(table - min_value)
table_inv = max_value - distance_from_min
table_inv = np.clip(table_inv, min_value, max_value).astype(np.uint8)
if threshold is not None:
table = table.astype(np.uint8)
if invert_above_threshold:
table_inv = np.concatenate([
table[0:int(threshold)],
table_inv[int(threshold):]
], axis=0)
else:
table_inv = np.concatenate([
table_inv[0:int(threshold)],
table[int(threshold):]
], axis=0)
return table_inv
[docs]def solarize(image, threshold=128):
"""Invert pixel values above a threshold.
Added in 0.4.0.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.solarize_`.
Parameters
----------
image : ndarray
See :func:`solarize_`.
threshold : None or number, optional
See :func:`solarize_`.
Returns
-------
ndarray
Inverted image.
"""
return solarize_(np.copy(image), threshold=threshold)
[docs]def solarize_(image, threshold=128):
"""Invert pixel values above a threshold in-place.
This function is a wrapper around :func:`invert`.
This function performs the same transformation as
:func:`PIL.ImageOps.solarize`.
Added in 0.4.0.
**Supported dtypes**:
See ``~imgaug.augmenters.arithmetic.invert_(min_value=None and max_value=None)``.
Parameters
----------
image : ndarray
See :func:`invert_`.
threshold : None or number, optional
See :func:`invert_`.
Note: The default threshold is optimized for ``uint8`` images.
Returns
-------
ndarray
Inverted image. This *can* be the same array as input in `image`,
modified in-place.
"""
return invert_(image, threshold=threshold)
[docs]def compress_jpeg(image, compression):
"""Compress an image using jpeg compression.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: ?
* ``uint32``: ?
* ``uint64``: ?
* ``int8``: ?
* ``int16``: ?
* ``int32``: ?
* ``int64``: ?
* ``float16``: ?
* ``float32``: ?
* ``float64``: ?
* ``float128``: ?
* ``bool``: ?
Parameters
----------
image : ndarray
Image of dtype ``uint8`` and shape ``(H,W,[C])``. If ``C`` is provided,
it must be ``1`` or ``3``.
compression : int
Strength of the compression in the interval ``[0, 100]``.
Returns
-------
ndarray
Input image after applying jpeg compression to it and reloading
the result into a new array. Same shape and dtype as the input.
"""
import PIL.Image
if image.size == 0:
return np.copy(image)
# The value range 1 to 95 is suggested by PIL's save() documentation
# Values above 95 seem to not make sense (no improvement in visual
# quality, but large file size).
# A value of 100 would mostly deactivate jpeg compression.
# A value of 0 would lead to no compression (instead of maximum
# compression).
# We use range 1 to 100 here, because this augmenter is about
# generating images for training and not for saving, hence we do not
# care about large file sizes.
maximum_quality = 100
minimum_quality = 1
assert image.dtype.name == "uint8", (
"Jpeg compression can only be applied to uint8 images. "
"Got dtype %s." % (image.dtype.name,))
assert 0 <= compression <= 100, (
"Expected compression to be in the interval [0, 100], "
"got %.4f." % (compression,))
has_no_channels = (image.ndim == 2)
is_single_channel = (image.ndim == 3 and image.shape[-1] == 1)
if is_single_channel:
image = image[..., 0]
assert has_no_channels or is_single_channel or image.shape[-1] == 3, (
"Expected either a grayscale image of shape (H,W) or (H,W,1) or an "
"RGB image of shape (H,W,3). Got shape %s." % (image.shape,))
# Map from compression to quality used by PIL
# We have valid compressions from 0 to 100, i.e. 101 possible
# values
quality = int(
np.clip(
np.round(
minimum_quality
+ (maximum_quality - minimum_quality)
* (1.0 - (compression / 101))
),
minimum_quality,
maximum_quality
)
)
image_pil = PIL.Image.fromarray(image)
with tempfile.NamedTemporaryFile(mode="wb+", suffix=".jpg") as f:
image_pil.save(f, quality=quality)
# Read back from file.
# We dont read from f.name, because that leads to PermissionDenied
# errors on Windows. We add f.seek(0) here, because otherwise we get
# `SyntaxError: index out of range` in PIL.
f.seek(0)
pilmode = "RGB"
if has_no_channels or is_single_channel:
pilmode = "L"
image = imageio.imread(f, pilmode=pilmode, format="jpeg")
if is_single_channel:
image = image[..., np.newaxis]
return image
[docs]class Add(meta.Augmenter):
"""
Add a value to all pixels in an image.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.add_scalar`.
Parameters
----------
value : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Value to add to all pixels.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, then a value from the discrete
interval ``[a..b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a value will be sampled per
image from that parameter.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Add(10)
Always adds a value of 10 to all channels of all pixels of all input
images.
>>> aug = iaa.Add((-10, 10))
Adds a value from the discrete interval ``[-10..10]`` to all pixels of
input images. The exact value is sampled per image.
>>> aug = iaa.Add((-10, 10), per_channel=True)
Adds a value from the discrete interval ``[-10..10]`` to all pixels of
input images. The exact value is sampled per image *and* channel,
i.e. to a red-channel it might add 5 while subtracting 7 from the
blue channel of the same image.
>>> aug = iaa.Add((-10, 10), per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, value=(-20, 20), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(Add, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.value = iap.handle_continuous_param(
value, "value", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
self.per_channel = iap.handle_probability_param(
per_channel, "per_channel")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
nb_channels_max = meta.estimate_max_number_of_channels(images)
rss = random_state.duplicate(2)
per_channel_samples = self.per_channel.draw_samples(
(nb_images,), random_state=rss[0])
value_samples = self.value.draw_samples(
(nb_images, nb_channels_max), random_state=rss[1])
gen = enumerate(zip(images, value_samples, per_channel_samples))
for i, (image, value_samples_i, per_channel_samples_i) in gen:
nb_channels = image.shape[2]
# Example code to directly add images via image+sample (uint8 only)
# if per_channel_samples_i > 0.5:
# result = []
# image = image.astype(np.int16)
# value_samples_i = value_samples_i.astype(np.int16)
# for c, value in enumerate(value_samples_i[0:nb_channels]):
# result.append(
# np.clip(
# image[..., c:c+1] + value, 0, 255
# ).astype(np.uint8))
# images[i] = np.concatenate(result, axis=2)
# else:
# images[i] = np.clip(
# image.astype(np.int16)
# + value_samples_i[0].astype(np.int16),
# 0, 255
# ).astype(np.uint8)
if per_channel_samples_i > 0.5:
value = value_samples_i[0:nb_channels]
else:
# the if/else here catches the case of the channel axis being 0
value = value_samples_i[0] if value_samples_i.size > 0 else []
batch.images[i] = add_scalar(image, value)
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.value, self.per_channel]
# TODO merge this with Add
[docs]class AddElementwise(meta.Augmenter):
"""
Add to the pixels of images values that are pixelwise randomly sampled.
While the ``Add`` Augmenter samples one value to add *per image* (and
optionally per channel), this augmenter samples different values per image
and *per pixel* (and optionally per channel), i.e. intensities of
neighbouring pixels may be increased/decreased by different amounts.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.add_elementwise`.
Parameters
----------
value : int or tuple of int or list of int or imgaug.parameters.StochasticParameter, optional
Value to add to the pixels.
* If an int, exactly that value will always be used.
* If a tuple ``(a, b)``, then values from the discrete interval
``[a..b]`` will be sampled per image and pixel.
* If a list of integers, a random value will be sampled from the
list per image and pixel.
* If a ``StochasticParameter``, then values will be sampled per
image and pixel from that parameter.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.AddElementwise(10)
Always adds a value of 10 to all channels of all pixels of all input
images.
>>> aug = iaa.AddElementwise((-10, 10))
Samples per image and pixel a value from the discrete interval
``[-10..10]`` and adds that value to the respective pixel.
>>> aug = iaa.AddElementwise((-10, 10), per_channel=True)
Samples per image, pixel *and also channel* a value from the discrete
interval ``[-10..10]`` and adds it to the respective pixel's channel value.
Therefore, added values may differ between channels of the same pixel.
>>> aug = iaa.AddElementwise((-10, 10), per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, value=(-20, 20), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(AddElementwise, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.value = iap.handle_continuous_param(
value, "value", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
self.per_channel = iap.handle_probability_param(
per_channel, "per_channel")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
rss = random_state.duplicate(1+nb_images)
per_channel_samples = self.per_channel.draw_samples(
(nb_images,), random_state=rss[0])
gen = enumerate(zip(images, per_channel_samples, rss[1:]))
for i, (image, per_channel_samples_i, rs) in gen:
height, width, nb_channels = image.shape
sample_shape = (height,
width,
nb_channels if per_channel_samples_i > 0.5 else 1)
values = self.value.draw_samples(sample_shape, random_state=rs)
batch.images[i] = add_elementwise(image, values)
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.value, self.per_channel]
# TODO rename to AddGaussianNoise?
# TODO examples say that iaa.AdditiveGaussianNoise(scale=(0, 0.1*255)) samples
# the scale from the uniform dist. per image, but is that still the case?
# AddElementwise seems to now sample once for all images, which should
# lead to a single scale value.
[docs]class AdditiveGaussianNoise(AddElementwise):
"""
Add noise sampled from gaussian distributions elementwise to images.
This augmenter samples and adds noise elementwise, i.e. it can add
different noise values to neighbouring pixels and is comparable
to ``AddElementwise``.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.AddElementwise`.
Parameters
----------
loc : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Mean of the normal distribution from which the noise is sampled.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, a random value from the interval
``[a, b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list per
image.
* If a ``StochasticParameter``, a value will be sampled from the
parameter per image.
scale : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Standard deviation of the normal distribution that generates the noise.
Must be ``>=0``. If ``0`` then `loc` will simply be added to all
pixels.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, a random value from the interval
``[a, b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list per
image.
* If a ``StochasticParameter``, a value will be sampled from the
parameter per image.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.AdditiveGaussianNoise(scale=0.1*255)
Adds gaussian noise from the distribution ``N(0, 0.1*255)`` to images.
The samples are drawn per image and pixel.
>>> aug = iaa.AdditiveGaussianNoise(scale=(0, 0.1*255))
Adds gaussian noise from the distribution ``N(0, s)`` to images,
where ``s`` is sampled per image from the interval ``[0, 0.1*255]``.
>>> aug = iaa.AdditiveGaussianNoise(scale=0.1*255, per_channel=True)
Adds gaussian noise from the distribution ``N(0, 0.1*255)`` to images,
where the noise value is different per image and pixel *and* channel (e.g.
a different one for red, green and blue channels of the same pixel).
This leads to "colorful" noise.
>>> aug = iaa.AdditiveGaussianNoise(scale=0.1*255, per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, loc=0, scale=(0, 15), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
loc2 = iap.handle_continuous_param(
loc, "loc", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
scale2 = iap.handle_continuous_param(
scale, "scale", value_range=(0, None), tuple_to_uniform=True,
list_to_choice=True)
value = iap.Normal(loc=loc2, scale=scale2)
super(AdditiveGaussianNoise, self).__init__(
value, per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# TODO add tests
# TODO rename to AddLaplaceNoise?
[docs]class AdditiveLaplaceNoise(AddElementwise):
"""
Add noise sampled from laplace distributions elementwise to images.
The laplace distribution is similar to the gaussian distribution, but
puts more weight on the long tail. Hence, this noise will add more
outliers (very high/low values). It is somewhere between gaussian noise and
salt and pepper noise.
Values of around ``255 * 0.05`` for `scale` lead to visible noise (for
``uint8``).
Values of around ``255 * 0.10`` for `scale` lead to very visible
noise (for ``uint8``).
It is recommended to usually set `per_channel` to ``True``.
This augmenter samples and adds noise elementwise, i.e. it can add
different noise values to neighbouring pixels and is comparable
to ``AddElementwise``.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.AddElementwise`.
Parameters
----------
loc : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Mean of the laplace distribution that generates the noise.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, a random value from the interval
``[a, b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list per
image.
* If a ``StochasticParameter``, a value will be sampled from the
parameter per image.
scale : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Standard deviation of the laplace distribution that generates the noise.
Must be ``>=0``. If ``0`` then only `loc` will be used.
Recommended to be around ``255*0.05``.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, a random value from the interval
``[a, b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list per
image.
* If a ``StochasticParameter``, a value will be sampled from the
parameter per image.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.AdditiveLaplaceNoise(scale=0.1*255)
Adds laplace noise from the distribution ``Laplace(0, 0.1*255)`` to images.
The samples are drawn per image and pixel.
>>> aug = iaa.AdditiveLaplaceNoise(scale=(0, 0.1*255))
Adds laplace noise from the distribution ``Laplace(0, s)`` to images,
where ``s`` is sampled per image from the interval ``[0, 0.1*255]``.
>>> aug = iaa.AdditiveLaplaceNoise(scale=0.1*255, per_channel=True)
Adds laplace noise from the distribution ``Laplace(0, 0.1*255)`` to images,
where the noise value is different per image and pixel *and* channel (e.g.
a different one for the red, green and blue channels of the same pixel).
This leads to "colorful" noise.
>>> aug = iaa.AdditiveLaplaceNoise(scale=0.1*255, per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, loc=0, scale=(0, 15), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
loc2 = iap.handle_continuous_param(
loc, "loc", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
scale2 = iap.handle_continuous_param(
scale, "scale", value_range=(0, None), tuple_to_uniform=True,
list_to_choice=True)
value = iap.Laplace(loc=loc2, scale=scale2)
super(AdditiveLaplaceNoise, self).__init__(
value,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# TODO add tests
# TODO rename to AddPoissonNoise?
[docs]class AdditivePoissonNoise(AddElementwise):
"""
Add noise sampled from poisson distributions elementwise to images.
Poisson noise is comparable to gaussian noise, as e.g. generated via
``AdditiveGaussianNoise``. As poisson distributions produce only positive
numbers, the sign of the sampled values are here randomly flipped.
Values of around ``10.0`` for `lam` lead to visible noise (for ``uint8``).
Values of around ``20.0`` for `lam` lead to very visible noise (for
``uint8``).
It is recommended to usually set `per_channel` to ``True``.
This augmenter samples and adds noise elementwise, i.e. it can add
different noise values to neighbouring pixels and is comparable
to ``AddElementwise``.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.AddElementwise`.
Parameters
----------
lam : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Lambda parameter of the poisson distribution. Must be ``>=0``.
Recommended values are around ``0.0`` to ``10.0``.
* If a number, exactly that value will always be used.
* If a tuple ``(a, b)``, a random value from the interval
``[a, b]`` will be sampled per image.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, a value will be sampled from the
parameter per image.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.AdditivePoissonNoise(lam=5.0)
Adds poisson noise sampled from a poisson distribution with a ``lambda``
parameter of ``5.0`` to images.
The samples are drawn per image and pixel.
>>> aug = iaa.AdditivePoissonNoise(lam=(0.0, 15.0))
Adds poisson noise sampled from ``Poisson(x)`` to images, where ``x`` is
randomly sampled per image from the interval ``[0.0, 15.0]``.
>>> aug = iaa.AdditivePoissonNoise(lam=5.0, per_channel=True)
Adds poisson noise sampled from ``Poisson(5.0)`` to images,
where the values are different per image and pixel *and* channel (e.g. a
different one for red, green and blue channels for the same pixel).
>>> aug = iaa.AdditivePoissonNoise(lam=(0.0, 15.0), per_channel=True)
Adds poisson noise sampled from ``Poisson(x)`` to images,
with ``x`` being sampled from ``uniform(0.0, 15.0)`` per image and
channel. This is the *recommended* configuration.
>>> aug = iaa.AdditivePoissonNoise(lam=(0.0, 15.0), per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, lam=(0.0, 15.0), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
lam2 = iap.handle_continuous_param(
lam, "lam",
value_range=(0, None), tuple_to_uniform=True, list_to_choice=True)
value = iap.RandomSign(iap.Poisson(lam=lam2))
super(AdditivePoissonNoise, self).__init__(
value,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class Multiply(meta.Augmenter):
"""
Multiply all pixels in an image with a random value sampled once per image.
This augmenter can be used to make images lighter or darker.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.multiply_scalar`.
Parameters
----------
mul : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
The value with which to multiply the pixel values in each image.
* If a number, then that value will always be used.
* If a tuple ``(a, b)``, then a value from the interval ``[a, b]``
will be sampled per image and used for all pixels.
* If a list, then a random value will be sampled from that list per
image.
* If a ``StochasticParameter``, then that parameter will be used to
sample a new value per image.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Multiply(2.0)
Multiplies all images by a factor of ``2``, making the images significantly
brighter.
>>> aug = iaa.Multiply((0.5, 1.5))
Multiplies images by a random value sampled uniformly from the interval
``[0.5, 1.5]``, making some images darker and others brighter.
>>> aug = iaa.Multiply((0.5, 1.5), per_channel=True)
Identical to the previous example, but the sampled multipliers differ by
image *and* channel, instead of only by image.
>>> aug = iaa.Multiply((0.5, 1.5), per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, mul=(0.8, 1.2), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(Multiply, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.mul = iap.handle_continuous_param(
mul, "mul", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
self.per_channel = iap.handle_probability_param(
per_channel, "per_channel")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
nb_channels_max = meta.estimate_max_number_of_channels(images)
rss = random_state.duplicate(2)
per_channel_samples = self.per_channel.draw_samples(
(nb_images,), random_state=rss[0])
mul_samples = self.mul.draw_samples(
(nb_images, nb_channels_max), random_state=rss[1])
gen = enumerate(zip(images, mul_samples, per_channel_samples))
for i, (image, mul_samples_i, per_channel_samples_i) in gen:
nb_channels = image.shape[2]
# Example code to directly multiply images via image*sample
# (uint8 only) -- apparently slower than LUT
# if per_channel_samples_i > 0.5:
# result = []
# image = image.astype(np.float32)
# mul_samples_i = mul_samples_i.astype(np.float32)
# for c, mul in enumerate(mul_samples_i[0:nb_channels]):
# result.append(
# np.clip(
# image[..., c:c+1] * mul, 0, 255
# ).astype(np.uint8))
# images[i] = np.concatenate(result, axis=2)
# else:
# images[i] = np.clip(
# image.astype(np.float32)
# * mul_samples_i[0].astype(np.float32),
# 0, 255
# ).astype(np.uint8)
if per_channel_samples_i > 0.5:
mul = mul_samples_i[0:nb_channels]
else:
# the if/else here catches the case of the channel axis being 0
mul = mul_samples_i[0] if mul_samples_i.size > 0 else []
batch.images[i] = multiply_scalar(image, mul)
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.mul, self.per_channel]
# TODO merge with Multiply
[docs]class MultiplyElementwise(meta.Augmenter):
"""
Multiply image pixels with values that are pixelwise randomly sampled.
While the ``Multiply`` Augmenter uses a constant multiplier *per
image* (and optionally channel), this augmenter samples the multipliers
to use per image and *per pixel* (and optionally per channel).
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.multiply_elementwise`.
Parameters
----------
mul : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
The value with which to multiply pixel values in the image.
* If a number, then that value will always be used.
* If a tuple ``(a, b)``, then a value from the interval ``[a, b]``
will be sampled per image and pixel.
* If a list, then a random value will be sampled from that list
per image and pixel.
* If a ``StochasticParameter``, then that parameter will be used to
sample a new value per image and pixel.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.MultiplyElementwise(2.0)
Multiply all images by a factor of ``2.0``, making them significantly
bighter.
>>> aug = iaa.MultiplyElementwise((0.5, 1.5))
Samples per image and pixel uniformly a value from the interval
``[0.5, 1.5]`` and multiplies the pixel with that value.
>>> aug = iaa.MultiplyElementwise((0.5, 1.5), per_channel=True)
Samples per image and pixel *and channel* uniformly a value from the
interval ``[0.5, 1.5]`` and multiplies the pixel with that value. Therefore,
used multipliers may differ between channels of the same pixel.
>>> aug = iaa.MultiplyElementwise((0.5, 1.5), per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
def __init__(self, mul=(0.8, 1.2), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(MultiplyElementwise, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.mul = iap.handle_continuous_param(
mul, "mul",
value_range=None, tuple_to_uniform=True, list_to_choice=True)
self.per_channel = iap.handle_probability_param(per_channel,
"per_channel")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
rss = random_state.duplicate(1+nb_images)
per_channel_samples = self.per_channel.draw_samples(
(nb_images,), random_state=rss[0])
is_mul_binomial = isinstance(self.mul, iap.Binomial) or (
isinstance(self.mul, iap.FromLowerResolution)
and isinstance(self.mul.other_param, iap.Binomial)
)
gen = enumerate(zip(images, per_channel_samples, rss[1:]))
for i, (image, per_channel_samples_i, rs) in gen:
height, width, nb_channels = image.shape
sample_shape = (height,
width,
nb_channels if per_channel_samples_i > 0.5 else 1)
mul = self.mul.draw_samples(sample_shape, random_state=rs)
# TODO let Binomial return boolean mask directly instead of [0, 1]
# integers?
# hack to improve performance for Dropout and CoarseDropout
# converts mul samples to mask if mul is binomial
if mul.dtype.kind != "b" and is_mul_binomial:
mul = mul.astype(bool, copy=False)
batch.images[i] = multiply_elementwise(image, mul)
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.mul, self.per_channel]
# Added in 0.4.0.
class _CutoutSamples(object):
# Added in 0.4.0.
def __init__(self, nb_iterations, pos_x, pos_y, size_h, size_w, squared,
fill_mode, cval, fill_per_channel):
self.nb_iterations = nb_iterations
self.pos_x = pos_x
self.pos_y = pos_y
self.size_h = size_h
self.size_w = size_w
self.squared = squared
self.fill_mode = fill_mode
self.cval = cval
self.fill_per_channel = fill_per_channel
[docs]class Cutout(meta.Augmenter):
"""Fill one or more rectangular areas in an image using a fill mode.
See paper "Improved Regularization of Convolutional Neural Networks with
Cutout" by DeVries and Taylor.
In contrast to the paper, this implementation also supports replacing
image sub-areas with gaussian noise, random intensities or random RGB
colors. It also supports non-squared areas. While the paper uses
absolute pixel values for the size and position, this implementation
uses relative values, which seems more appropriate for mixed-size
datasets. The position parameter furthermore allows more flexibility, e.g.
gaussian distributions around the center.
.. note::
This augmenter affects only image data. Other datatypes (e.g.
segmentation map pixels or keypoints within the filled areas)
are not affected.
.. note::
Gaussian fill mode will assume that float input images contain values
in the interval ``[0.0, 1.0]`` and hence sample values from a
gaussian within that interval, i.e. from ``N(0.5, std=0.5/3)``.
Added in 0.4.0.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.cutout_`.
Parameters
----------
nb_iterations : int or tuple of int or list of int or imgaug.parameters.StochasticParameter, optional
How many rectangular areas to fill.
* If ``int``: Exactly that many areas will be filled on all images.
* If ``tuple`` ``(a, b)``: A value from the interval ``[a, b]``
will be sampled per image.
* If ``list``: A random value will be sampled from that ``list``
per image.
* If ``StochasticParameter``: That parameter will be used to
sample ``(B,)`` values per batch of ``B`` images.
position : {'uniform', 'normal', 'center', 'left-top', 'left-center', 'left-bottom', 'center-top', 'center-center', 'center-bottom', 'right-top', 'right-center', 'right-bottom'} or tuple of float or StochasticParameter or tuple of StochasticParameter, optional
Defines the position of each area to fill.
Analogous to the definition in e.g.
:class:`~imgaug.augmenters.size.CropToFixedSize`.
Usually, ``uniform`` (anywhere in the image) or ``normal`` (anywhere
in the image with preference around the center) are sane values.
size : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
The size of the rectangle to fill as a fraction of the corresponding
image size, i.e. with value range ``[0.0, 1.0]``. The size is sampled
independently per image axis.
* If ``number``: Exactly that size is always used.
* If ``tuple`` ``(a, b)``: A value from the interval ``[a, b]``
will be sampled per area and axis.
* If ``list``: A random value will be sampled from that ``list``
per area and axis.
* If ``StochasticParameter``: That parameter will be used to
sample ``(N, 2)`` values per batch, where ``N`` is the total
number of areas to fill within the whole batch.
squared : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to generate only squared areas cutout areas or allow
rectangular ones. If this evaluates to a true-like value, the
first value from `size` will be converted to absolute pixels and used
for both axes.
If this value is a float ``p``, then for ``p`` percent of all areas
to be filled `per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
fill_mode : str or list of str or imgaug.parameters.StochasticParameter, optional
Mode to use in order to fill areas. Corresponds to ``mode`` parameter
in some other augmenters. Valid strings for the mode are:
* ``contant``: Fill each area with a single value.
* ``gaussian``: Fill each area with gaussian noise.
Valid datatypes are:
* If ``str``: Exactly that mode will alaways be used.
* If ``list``: A random value will be sampled from that ``list``
per area.
* If ``StochasticParameter``: That parameter will be used to
sample ``(N,)`` values per batch, where ``N`` is the total number
of areas to fill within the whole batch.
cval : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
The value to use (i.e. the color) to fill areas if `fill_mode` is
```constant``.
* If ``number``: Exactly that value is used for all areas
and channels.
* If ``tuple`` ``(a, b)``: A value from the interval ``[a, b]``
will be sampled per area (and channel if ``per_channel=True``).
* If ``list``: A random value will be sampled from that ``list``
per area (and channel if ``per_channel=True``).
* If ``StochasticParameter``: That parameter will be used to
sample ``(N, Cmax)`` values per batch, where ``N`` is the total
number of areas to fill within the whole batch and ``Cmax``
is the maximum number of channels in any image (usually ``3``).
If ``per_channel=False``, only the first value of the second
axis is used.
fill_per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to fill each area in a channelwise fashion (``True``) or
not (``False``).
The behaviour per fill mode is:
* ``constant``: Whether to fill all channels with the same value
(i.e, grayscale) or different values (i.e. usually RGB color).
* ``gaussian``: Whether to sample once from a gaussian and use the
values for all channels (i.e. grayscale) or to sample
channelwise (i.e. RGB colors)
If this value is a float ``p``, then for ``p`` percent of all areas
to be filled `per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
deterministic : bool, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.bit_generator.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Cutout(nb_iterations=2)
Fill per image two random areas, by default with grayish pixels.
>>> aug = iaa.Cutout(nb_iterations=(1, 5), size=0.2, squared=False)
Fill per image between one and five areas, each having ``20%``
of the corresponding size of the height and width (for non-square
images this results in non-square areas to be filled).
>>> aug = iaa.Cutout(fill_mode="constant", cval=255)
Fill all areas with white pixels.
>>> aug = iaa.Cutout(fill_mode="constant", cval=(0, 255),
>>> fill_per_channel=0.5)
Fill ``50%`` of all areas with a random intensity value between
``0`` and ``256``. Fill the other ``50%`` of all areas with
random colors.
>>> aug = iaa.Cutout(fill_mode="gaussian", fill_per_channel=True)
Fill areas with gaussian channelwise noise (i.e. usually RGB).
"""
# Added in 0.4.0.
def __init__(self,
nb_iterations=1,
position="uniform",
size=0.2,
squared=True,
fill_mode="constant",
cval=128,
fill_per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
from .size import _handle_position_parameter # TODO move to iap
from .geometric import _handle_cval_arg # TODO move to iap
super(Cutout, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.nb_iterations = iap.handle_discrete_param(
nb_iterations, "nb_iterations", value_range=(0, None),
tuple_to_uniform=True, list_to_choice=True, allow_floats=False)
self.position = _handle_position_parameter(position)
self.size = iap.handle_continuous_param(
size, "size", value_range=(0.0, 1.0+1e-4),
tuple_to_uniform=True, list_to_choice=True)
self.squared = iap.handle_probability_param(squared, "squared")
self.fill_mode = self._handle_fill_mode_param(fill_mode)
self.cval = _handle_cval_arg(cval)
self.fill_per_channel = iap.handle_probability_param(
fill_per_channel, "fill_per_channel")
# Added in 0.4.0.
@classmethod
def _handle_fill_mode_param(cls, fill_mode):
if ia.is_string(fill_mode):
assert fill_mode in _CUTOUT_FILL_MODES, (
"Expected 'fill_mode' to be one of: %s. Got %s." % (
str(list(_CUTOUT_FILL_MODES.keys())), fill_mode))
return iap.Deterministic(fill_mode)
if isinstance(fill_mode, iap.StochasticParameter):
return fill_mode
assert ia.is_iterable(fill_mode), (
"Expected 'fill_mode' to be a string, "
"StochasticParameter or list of strings. Got type %s." % (
type(fill_mode).__name__))
return iap.Choice(fill_mode)
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
samples = self._draw_samples(batch.images, random_state)
# map from xyhw to xyxy (both relative coords)
cutout_height_half = samples.size_h / 2
cutout_width_half = samples.size_w / 2
x1_rel = samples.pos_x - cutout_width_half
y1_rel = samples.pos_y - cutout_height_half
x2_rel = samples.pos_x + cutout_width_half
y2_rel = samples.pos_y + cutout_height_half
nb_iterations_sum = 0
gen = enumerate(zip(batch.images, samples.nb_iterations))
for i, (image, nb_iterations) in gen:
start = nb_iterations_sum
end = start + nb_iterations
height, width = image.shape[0:2]
# map from relative xyxy to absolute xyxy coords
batch.images[i] = self._augment_image_by_samples(
image,
x1_rel[start:end] * width,
y1_rel[start:end] * height,
x2_rel[start:end] * width,
y2_rel[start:end] * height,
samples.squared[start:end],
samples.fill_mode[start:end],
samples.cval[start:end],
samples.fill_per_channel[start:end],
random_state)
nb_iterations_sum += nb_iterations
return batch
# Added in 0.4.0.
def _draw_samples(self, images, random_state):
rngs = random_state.duplicate(8)
nb_rows = len(images)
nb_channels_max = meta.estimate_max_number_of_channels(images)
nb_iterations = self.nb_iterations.draw_samples(
(nb_rows,), random_state=rngs[0])
nb_dropped_areas = int(np.sum(nb_iterations))
if isinstance(self.position, tuple):
pos_x = self.position[0].draw_samples((nb_dropped_areas,),
random_state=rngs[1])
pos_y = self.position[1].draw_samples((nb_dropped_areas,),
random_state=rngs[2])
else:
pos = self.position.draw_samples((nb_dropped_areas, 2),
random_state=rngs[1])
pos_x = pos[:, 0]
pos_y = pos[:, 1]
size = self.size.draw_samples((nb_dropped_areas, 2),
random_state=rngs[3])
squared = self.squared.draw_samples((nb_dropped_areas,),
random_state=rngs[4])
fill_mode = self.fill_mode.draw_samples(
(nb_dropped_areas,), random_state=rngs[5])
cval = self.cval.draw_samples((nb_dropped_areas, nb_channels_max),
random_state=rngs[6])
fill_per_channel = self.fill_per_channel.draw_samples(
(nb_dropped_areas,), random_state=rngs[7])
return _CutoutSamples(
nb_iterations=nb_iterations,
pos_x=pos_x,
pos_y=pos_y,
size_h=size[:, 0],
size_w=size[:, 1],
squared=squared,
fill_mode=fill_mode,
cval=cval,
fill_per_channel=fill_per_channel
)
# Added in 0.4.0.
@classmethod
def _augment_image_by_samples(cls, image, x1, y1, x2, y2, squared,
fill_mode, cval, fill_per_channel,
random_state):
for i, x1_i in enumerate(x1):
x2_i = x2[i]
if squared[i] >= 0.5:
height_h = (y2[i] - y1[i]) / 2
x_center = x1_i + (x2_i - x1_i) / 2
x1_i = x_center - height_h
x2_i = x_center + height_h
image = cutout_(
image,
x1=x1_i,
y1=y1[i],
x2=x2_i,
y2=y2[i],
fill_mode=fill_mode[i],
cval=cval[i],
fill_per_channel=fill_per_channel[i],
seed=random_state)
return image
# Added in 0.4.0.
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.nb_iterations, self.position, self.size, self.squared,
self.fill_mode, self.cval, self.fill_per_channel]
# TODO verify that (a, b) still leads to a p being sampled per image and not
# per batch
[docs]class Dropout(MultiplyElementwise):
"""
Set a fraction of pixels in images to zero.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.MultiplyElementwise`.
Parameters
----------
p : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The probability of any pixel being dropped (i.e. to set it to zero).
* If a float, then that value will be used for all images. A value
of ``1.0`` would mean that all pixels will be dropped
and ``0.0`` that no pixels will be dropped. A value of ``0.05``
corresponds to ``5`` percent of all pixels being dropped.
* If a tuple ``(a, b)``, then a value ``p`` will be sampled from
the interval ``[a, b]`` per image and be used as the pixel's
dropout probability.
* If a list, then a value will be sampled from that list per
batch and used as the probability.
* If a ``StochasticParameter``, then this parameter will be used to
determine per pixel whether it should be *kept* (sampled value
of ``>0.5``) or shouldn't be kept (sampled value of ``<=0.5``).
If you instead want to provide the probability as a stochastic
parameter, you can usually do ``imgaug.parameters.Binomial(1-p)``
to convert parameter `p` to a 0/1 representation.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Dropout(0.02)
Drops ``2`` percent of all pixels.
>>> aug = iaa.Dropout((0.0, 0.05))
Drops in each image a random fraction of all pixels, where the fraction
is uniformly sampled from the interval ``[0.0, 0.05]``.
>>> aug = iaa.Dropout(0.02, per_channel=True)
Drops ``2`` percent of all pixels in a channelwise fashion, i.e. it is
unlikely for any pixel to have all channels set to zero (black pixels).
>>> aug = iaa.Dropout(0.02, per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for ``50`` percent of all images.
"""
def __init__(self, p=(0.0, 0.05), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
p_param = _handle_dropout_probability_param(p, "p")
super(Dropout, self).__init__(
p_param,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# Added in 0.4.0.
def _handle_dropout_probability_param(p, name):
if ia.is_single_number(p):
p_param = iap.Binomial(1 - p)
elif isinstance(p, tuple):
assert len(p) == 2, (
"Expected `%s` to be given as a tuple containing exactly 2 values, "
"got %d values." % (name, len(p),))
assert p[0] < p[1], (
"Expected `%s` to be given as a tuple containing exactly 2 values "
"(a, b) with a < b. Got %.4f and %.4f." % (name, p[0], p[1]))
assert 0 <= p[0] <= 1.0 and 0 <= p[1] <= 1.0, (
"Expected `%s` given as tuple to only contain values in the "
"interval [0.0, 1.0], got %.4f and %.4f." % (name, p[0], p[1]))
p_param = iap.Binomial(iap.Uniform(1 - p[1], 1 - p[0]))
elif ia.is_iterable(p):
assert all([ia.is_single_number(v) for v in p]), (
"Expected iterable parameter '%s' to only contain numbers, "
"got %s." % (name, [type(v) for v in p],))
assert all([0 <= p_i <= 1.0 for p_i in p]), (
"Expected iterable parameter '%s' to only contain probabilities "
"in the interval [0.0, 1.0], got values %s." % (
name, ", ".join(["%.4f" % (p_i,) for p_i in p])))
p_param = iap.Binomial(1 - iap.Choice(p))
elif isinstance(p, iap.StochasticParameter):
p_param = p
else:
raise Exception(
"Expected `%s` to be float or int or tuple (<number>, <number>) "
"or StochasticParameter, got type '%s'." % (
name, type(p).__name__,))
return p_param
# TODO invert size_px and size_percent so that larger values denote larger
# areas being dropped instead of the opposite way around
[docs]class CoarseDropout(MultiplyElementwise):
"""
Set rectangular areas within images to zero.
In contrast to ``Dropout``, these areas can have larger sizes.
(E.g. you might end up with three large black rectangles in an image.)
Note that the current implementation leads to correlated sizes,
so if e.g. there is any thin and high rectangle that is dropped, there is
a high likelihood that all other dropped areas are also thin and high.
This method is implemented by generating the dropout mask at a
lower resolution (than the image has) and then upsampling the mask
before dropping the pixels.
This augmenter is similar to Cutout. Usually, cutout is defined as an
operation that drops exactly one rectangle from an image, while here
``CoarseDropout`` can drop multiple rectangles (with some correlation
between the sizes of these rectangles).
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.MultiplyElementwise`.
Parameters
----------
p : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The probability of any pixel being dropped (i.e. set to zero) in
the lower-resolution dropout mask.
* If a float, then that value will be used for all pixels. A value
of ``1.0`` would mean, that all pixels will be dropped. A value
of ``0.0`` would lead to no pixels being dropped.
* If a tuple ``(a, b)``, then a value ``p`` will be sampled from
the interval ``[a, b]`` per image and be used as the dropout
probability.
* If a list, then a value will be sampled from that list per
batch and used as the probability.
* If a ``StochasticParameter``, then this parameter will be used to
determine per pixel whether it should be *kept* (sampled value
of ``>0.5``) or shouldn't be kept (sampled value of ``<=0.5``).
If you instead want to provide the probability as a stochastic
parameter, you can usually do ``imgaug.parameters.Binomial(1-p)``
to convert parameter `p` to a 0/1 representation.
size_px : None or int or tuple of int or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the dropout
mask in absolute pixel dimensions.
Note that this means that *lower* values of this parameter lead to
*larger* areas being dropped (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_percent` must be set.
* If an integer, then that size will always be used for both height
and width. E.g. a value of ``3`` would lead to a ``3x3`` mask,
which is then upsampled to ``HxW``, where ``H`` is the image size
and ``W`` the image width.
* If a tuple ``(a, b)``, then two values ``M``, ``N`` will be
sampled from the discrete interval ``[a..b]``. The dropout mask
will then be generated at size ``MxN`` and upsampled to ``HxW``.
* If a ``StochasticParameter``, then this parameter will be used to
determine the sizes. It is expected to be discrete.
size_percent : None or float or tuple of float or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the dropout
mask *in percent* of the input image.
Note that this means that *lower* values of this parameter lead to
*larger* areas being dropped (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_px` must be set.
* If a float, then that value will always be used as the percentage
of the height and width (relative to the original size). E.g. for
value ``p``, the mask will be sampled from ``(p*H)x(p*W)`` and
later upsampled to ``HxW``.
* If a tuple ``(a, b)``, then two values ``m``, ``n`` will be
sampled from the interval ``(a, b)`` and used as the size
fractions, i.e the mask size will be ``(m*H)x(n*W)``.
* If a ``StochasticParameter``, then this parameter will be used to
sample the percentage values. It is expected to be continuous.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
min_size : int, optional
Minimum height and width of the low resolution mask. If
`size_percent` or `size_px` leads to a lower value than this,
`min_size` will be used instead. This should never have a value of
less than ``2``, otherwise one may end up with a ``1x1`` low resolution
mask, leading easily to the whole image being dropped.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.CoarseDropout(0.02, size_percent=0.5)
Drops ``2`` percent of all pixels on a lower-resolution image that has
``50`` percent of the original image's size, leading to dropped areas that
have roughly ``2x2`` pixels size.
>>> aug = iaa.CoarseDropout((0.0, 0.05), size_percent=(0.05, 0.5))
Generates a dropout mask at ``5`` to ``50`` percent of each input image's
size. In that mask, ``0`` to ``5`` percent of all pixels are marked as
being dropped. The mask is afterwards projected to the input image's
size to apply the actual dropout operation.
>>> aug = iaa.CoarseDropout((0.0, 0.05), size_px=(2, 16))
Same as the previous example, but the lower resolution image has ``2`` to
``16`` pixels size. On images of e.g. ``224x224` pixels in size this would
lead to fairly large areas being dropped (height/width of ``224/2`` to
``224/16``).
>>> aug = iaa.CoarseDropout(0.02, size_percent=0.5, per_channel=True)
Drops ``2`` percent of all pixels at ``50`` percent resolution (``2x2``
sizes) in a channel-wise fashion, i.e. it is unlikely for any pixel to
have all channels set to zero (black pixels).
>>> aug = iaa.CoarseDropout(0.02, size_percent=0.5, per_channel=0.5)
Same as the previous example, but the `per_channel` feature is only active
for ``50`` percent of all images.
"""
def __init__(self, p=(0.02, 0.1), size_px=None, size_percent=None,
per_channel=False, min_size=3,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
p_param = _handle_dropout_probability_param(p, "p")
if size_px is not None:
p_param = iap.FromLowerResolution(other_param=p_param,
size_px=size_px,
min_size=min_size)
elif size_percent is not None:
p_param = iap.FromLowerResolution(other_param=p_param,
size_percent=size_percent,
min_size=min_size)
else:
# default if neither size_px nor size_percent is provided
# is size_px=(3, 8)
p_param = iap.FromLowerResolution(other_param=p_param,
size_px=(3, 8),
min_size=min_size)
super(CoarseDropout, self).__init__(
p_param,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class Dropout2d(meta.Augmenter):
"""Drop random channels from images.
For image data, dropped channels will be filled with zeros.
.. note::
This augmenter may also set the arrays of heatmaps and segmentation
maps to zero and remove all coordinate-based data (e.g. it removes
all bounding boxes on images that were filled with zeros).
It does so if and only if *all* channels of an image are dropped.
If ``nb_keep_channels >= 1`` then that never happens.
Added in 0.4.0.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: yes; tested
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: yes; tested
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: yes; tested
* ``float128``: yes; tested
* ``bool``: yes; tested
Parameters
----------
p : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The probability of any channel to be dropped (i.e. set to zero).
* If a ``float``, then that value will be used for all channels.
A value of ``1.0`` would mean, that all channels will be dropped.
A value of ``0.0`` would lead to no channels being dropped.
* If a tuple ``(a, b)``, then a value ``p`` will be sampled from
the interval ``[a, b)`` per batch and be used as the dropout
probability.
* If a list, then a value will be sampled from that list per
batch and used as the probability.
* If a ``StochasticParameter``, then this parameter will be used to
determine per channel whether it should be *kept* (sampled value
of ``>=0.5``) or shouldn't be kept (sampled value of ``<0.5``).
If you instead want to provide the probability as a stochastic
parameter, you can usually do ``imgaug.parameters.Binomial(1-p)``
to convert parameter `p` to a 0/1 representation.
nb_keep_channels : int
Minimum number of channels to keep unaltered in all images.
E.g. a value of ``1`` means that at least one channel in every image
will not be dropped, even if ``p=1.0``. Set to ``0`` to allow dropping
all channels.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Dropout2d(p=0.5)
Create a dropout augmenter that drops on average half of all image
channels. Dropped channels will be filled with zeros. At least one
channel is kept unaltered in each image (default setting).
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Dropout2d(p=0.5, nb_keep_channels=0)
Create a dropout augmenter that drops on average half of all image
channels *and* may drop *all* channels in an image (i.e. images may
contain nothing but zeros).
"""
# Added in 0.4.0.
def __init__(self, p=0.1, nb_keep_channels=1,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(Dropout2d, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.p = _handle_dropout_probability_param(p, "p")
self.nb_keep_channels = max(nb_keep_channels, 0)
self._drop_images = True
self._drop_heatmaps = True
self._drop_segmentation_maps = True
self._drop_keypoints = True
self._drop_bounding_boxes = True
self._drop_polygons = True
self._drop_line_strings = True
self._heatmaps_cval = 0.0
self._segmentation_maps_cval = 0
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
imagewise_drop_channel_ids, all_dropped_ids = self._draw_samples(
batch, random_state)
if batch.images is not None:
for image, drop_ids in zip(batch.images,
imagewise_drop_channel_ids):
image[:, :, drop_ids] = 0
# Skip the non-image data steps below if we won't modify non-image
# anyways. Minor performance improvement.
if len(all_dropped_ids) == 0:
return batch
if batch.heatmaps is not None and self._drop_heatmaps:
cval = self._heatmaps_cval
for drop_idx in all_dropped_ids:
batch.heatmaps[drop_idx].arr_0to1[...] = cval
if batch.segmentation_maps is not None and self._drop_segmentation_maps:
cval = self._segmentation_maps_cval
for drop_idx in all_dropped_ids:
batch.segmentation_maps[drop_idx].arr[...] = cval
for attr_name in ["keypoints", "bounding_boxes", "polygons",
"line_strings"]:
do_drop = getattr(self, "_drop_%s" % (attr_name,))
attr_value = getattr(batch, attr_name)
if attr_value is not None and do_drop:
for drop_idx in all_dropped_ids:
# same as e.g.:
# batch.bounding_boxes[drop_idx].bounding_boxes = []
setattr(attr_value[drop_idx], attr_name, [])
return batch
# Added in 0.4.0.
def _draw_samples(self, batch, random_state):
# maybe noteworthy here that the channel axis can have size 0,
# e.g. (5, 5, 0)
shapes = batch.get_rowwise_shapes()
shapes = [shape
if len(shape) >= 2
else tuple(list(shape) + [1])
for shape in shapes]
imagewise_channels = np.array([
shape[2] for shape in shapes
], dtype=np.int32)
# channelwise drop value over all images (float <0.5 = drop channel)
p_samples = self.p.draw_samples((int(np.sum(imagewise_channels)),),
random_state=random_state)
# We map the flat p_samples array to an imagewise one,
# convert the mask to channel-ids to drop and remove channel ids if
# there are more to be dropped than are allowed to be dropped (see
# nb_keep_channels).
# We also track all_dropped_ids, which contains the ids of examples
# (not channel ids!) where all channels were dropped.
imagewise_channels_to_drop = []
all_dropped_ids = []
channel_idx = 0
for i, nb_channels in enumerate(imagewise_channels):
p_samples_i = p_samples[channel_idx:channel_idx+nb_channels]
drop_ids = np.nonzero(p_samples_i < 0.5)[0]
nb_dropable = max(nb_channels - self.nb_keep_channels, 0)
if len(drop_ids) > nb_dropable:
random_state.shuffle(drop_ids)
drop_ids = drop_ids[:nb_dropable]
imagewise_channels_to_drop.append(drop_ids)
all_dropped = (len(drop_ids) == nb_channels)
if all_dropped:
all_dropped_ids.append(i)
channel_idx += nb_channels
return imagewise_channels_to_drop, all_dropped_ids
# Added in 0.4.0.
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.p, self.nb_keep_channels]
[docs]class TotalDropout(meta.Augmenter):
"""Drop all channels of a defined fraction of all images.
For image data, all components of dropped images will be filled with zeros.
.. note::
This augmenter also sets the arrays of heatmaps and segmentation
maps to zero and removes all coordinate-based data (e.g. it removes
all bounding boxes on images that were filled with zeros).
Added in 0.4.0.
**Supported dtypes**:
* ``uint8``: yes; fully tested
* ``uint16``: yes; tested
* ``uint32``: yes; tested
* ``uint64``: yes; tested
* ``int8``: yes; tested
* ``int16``: yes; tested
* ``int32``: yes; tested
* ``int64``: yes; tested
* ``float16``: yes; tested
* ``float32``: yes; tested
* ``float64``: yes; tested
* ``float128``: yes; tested
* ``bool``: yes; tested
Parameters
----------
p : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The probability of an image to be filled with zeros.
* If ``float``: The value will be used for all images.
A value of ``1.0`` would mean that all images will be set to zero.
A value of ``0.0`` would lead to no images being set to zero.
* If ``tuple`` ``(a, b)``: A value ``p`` will be sampled from
the interval ``[a, b)`` per batch and be used as the dropout
probability.
* If a list, then a value will be sampled from that list per
batch and used as the probability.
* If ``StochasticParameter``: The parameter will be used to
determine per image whether it should be *kept* (sampled value
of ``>=0.5``) or shouldn't be kept (sampled value of ``<0.5``).
If you instead want to provide the probability as a stochastic
parameter, you can usually do ``imgaug.parameters.Binomial(1-p)``
to convert parameter `p` to a 0/1 representation.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.TotalDropout(1.0)
Create an augmenter that sets *all* components of all images to zero.
>>> aug = iaa.TotalDropout(0.5)
Create an augmenter that sets *all* components of ``50%`` of all images to
zero.
"""
# Added in 0.4.0.
def __init__(self, p=1,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(TotalDropout, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.p = _handle_dropout_probability_param(p, "p")
self._drop_images = True
self._drop_heatmaps = True
self._drop_segmentation_maps = True
self._drop_keypoints = True
self._drop_bounding_boxes = True
self._drop_polygons = True
self._drop_line_strings = True
self._heatmaps_cval = 0.0
self._segmentation_maps_cval = 0
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
drop_mask = self._draw_samples(batch, random_state)
drop_ids = None
if batch.images is not None and self._drop_images:
if ia.is_np_array(batch.images):
batch.images[drop_mask, ...] = 0
else:
drop_ids = self._generate_drop_ids_once(drop_mask, drop_ids)
for drop_idx in drop_ids:
batch.images[drop_idx][...] = 0
if batch.heatmaps is not None and self._drop_heatmaps:
drop_ids = self._generate_drop_ids_once(drop_mask, drop_ids)
cval = self._heatmaps_cval
for drop_idx in drop_ids:
batch.heatmaps[drop_idx].arr_0to1[...] = cval
if batch.segmentation_maps is not None and self._drop_segmentation_maps:
drop_ids = self._generate_drop_ids_once(drop_mask, drop_ids)
cval = self._segmentation_maps_cval
for drop_idx in drop_ids:
batch.segmentation_maps[drop_idx].arr[...] = cval
for attr_name in ["keypoints", "bounding_boxes", "polygons",
"line_strings"]:
do_drop = getattr(self, "_drop_%s" % (attr_name,))
attr_value = getattr(batch, attr_name)
if attr_value is not None and do_drop:
drop_ids = self._generate_drop_ids_once(drop_mask, drop_ids)
for drop_idx in drop_ids:
# same as e.g.:
# batch.bounding_boxes[drop_idx].bounding_boxes = []
setattr(attr_value[drop_idx], attr_name, [])
return batch
# Added in 0.4.0.
def _draw_samples(self, batch, random_state):
p = self.p.draw_samples((batch.nb_rows,), random_state=random_state)
drop_mask = (p < 0.5)
return drop_mask
# Added in 0.4.0.
@classmethod
def _generate_drop_ids_once(cls, drop_mask, drop_ids):
if drop_ids is None:
drop_ids = np.nonzero(drop_mask)[0]
return drop_ids
# Added in 0.4.0.
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.p]
[docs]class ReplaceElementwise(meta.Augmenter):
"""
Replace pixels in an image with new values.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.replace_elementwise_`.
Parameters
----------
mask : float or tuple of float or list of float or imgaug.parameters.StochasticParameter
Mask that indicates the pixels that are supposed to be replaced.
The mask will be binarized using a threshold of ``0.5``. A value
of ``1`` then indicates a pixel that is supposed to be replaced.
* If this is a float, then that value will be used as the
probability of being a ``1`` in the mask (sampled per image and
pixel) and hence being replaced.
* If a tuple ``(a, b)``, then the probability will be uniformly
sampled per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image and pixel.
* If a ``StochasticParameter``, then this parameter will be used to
sample a mask per image.
replacement : number or tuple of number or list of number or imgaug.parameters.StochasticParameter
The replacement to use at all locations that are marked as ``1`` in
the mask.
* If this is a number, then that value will always be used as the
replacement.
* If a tuple ``(a, b)``, then the replacement will be sampled
uniformly per image and pixel from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image and pixel.
* If a ``StochasticParameter``, then this parameter will be used
sample replacement values per image and pixel.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = ReplaceElementwise(0.05, [0, 255])
Replaces ``5`` percent of all pixels in each image by either ``0``
or ``255``.
>>> import imgaug.augmenters as iaa
>>> aug = ReplaceElementwise(0.1, [0, 255], per_channel=0.5)
For ``50%`` of all images, replace ``10%`` of all pixels with either the
value ``0`` or the value ``255`` (same as in the previous example). For
the other ``50%`` of all images, replace *channelwise* ``10%`` of all
pixels with either the value ``0`` or the value ``255``. So, it will be
very rare for each pixel to have all channels replaced by ``255`` or
``0``.
>>> import imgaug.augmenters as iaa
>>> import imgaug.parameters as iap
>>> aug = ReplaceElementwise(0.1, iap.Normal(128, 0.4*128), per_channel=0.5)
Replace ``10%`` of all pixels by gaussian noise centered around ``128``.
Both the replacement mask and the gaussian noise are sampled channelwise
for ``50%`` of all images.
>>> import imgaug.augmenters as iaa
>>> import imgaug.parameters as iap
>>> aug = ReplaceElementwise(
>>> iap.FromLowerResolution(iap.Binomial(0.1), size_px=8),
>>> iap.Normal(128, 0.4*128),
>>> per_channel=0.5)
Replace ``10%`` of all pixels by gaussian noise centered around ``128``.
Sample the replacement mask at a lower resolution (``8x8`` pixels) and
upscale it to the image size, resulting in coarse areas being replaced by
gaussian noise.
"""
def __init__(self, mask, replacement, per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(ReplaceElementwise, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
self.mask = iap.handle_probability_param(
mask, "mask", tuple_to_uniform=True, list_to_choice=True)
self.replacement = iap.handle_continuous_param(replacement,
"replacement")
self.per_channel = iap.handle_probability_param(per_channel,
"per_channel")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
rss = random_state.duplicate(1+2*nb_images)
per_channel_samples = self.per_channel.draw_samples(
(nb_images,), random_state=rss[0])
gen = enumerate(zip(images, per_channel_samples, rss[1::2], rss[2::2]))
for i, (image, per_channel_i, rs_mask, rs_replacement) in gen:
height, width, nb_channels = image.shape
sampling_shape = (height,
width,
nb_channels if per_channel_i > 0.5 else 1)
mask_samples = self.mask.draw_samples(sampling_shape,
random_state=rs_mask)
# TODO add separate per_channels for mask and replacement
# TODO add test that replacement with per_channel=False is not
# sampled per channel
if per_channel_i <= 0.5:
nb_channels = image.shape[-1]
replacement_samples = self.replacement.draw_samples(
(int(np.sum(mask_samples[:, :, 0])),),
random_state=rs_replacement)
# important here to use repeat instead of tile. repeat
# converts e.g. [0, 1, 2] to [0, 0, 1, 1, 2, 2], while tile
# leads to [0, 1, 2, 0, 1, 2]. The assignment below iterates
# over each channel and pixel simultaneously, *not* first
# over all pixels of channel 0, then all pixels in
# channel 1, ...
replacement_samples = np.repeat(replacement_samples,
nb_channels)
else:
replacement_samples = self.replacement.draw_samples(
(int(np.sum(mask_samples)),), random_state=rs_replacement)
batch.images[i] = replace_elementwise_(image, mask_samples,
replacement_samples)
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.mask, self.replacement, self.per_channel]
[docs]class SaltAndPepper(ReplaceElementwise):
"""
Replace pixels in images with salt/pepper noise (white/black-ish colors).
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of replacing a pixel to salt/pepper noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a image-sized mask will be
sampled from that parameter per image. Any value ``>0.5`` in
that mask will be replaced with salt and pepper noise.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.SaltAndPepper(0.05)
Replace ``5%`` of all pixels with salt and pepper noise.
>>> import imgaug.augmenters as iaa
>>> aug = iaa.SaltAndPepper(0.05, per_channel=True)
Replace *channelwise* ``5%`` of all pixels with salt and pepper
noise.
"""
def __init__(self, p=(0.0, 0.03), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(SaltAndPepper, self).__init__(
mask=p,
replacement=iap.Beta(0.5, 0.5) * 255,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class ImpulseNoise(SaltAndPepper):
"""
Add impulse noise to images.
This is identical to ``SaltAndPepper``, except that `per_channel` is
always set to ``True``.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.SaltAndPepper`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of replacing a pixel to impulse noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a image-sized mask will be
sampled from that parameter per image. Any value ``>0.5`` in
that mask will be replaced with impulse noise noise.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.ImpulseNoise(0.1)
Replace ``10%`` of all pixels with impulse noise.
"""
def __init__(self, p=(0.0, 0.03),
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(ImpulseNoise, self).__init__(
p=p,
per_channel=True,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class CoarseSaltAndPepper(ReplaceElementwise):
"""
Replace rectangular areas in images with white/black-ish pixel noise.
This adds salt and pepper noise (noisy white-ish and black-ish pixels) to
rectangular areas within the image. Note that this means that within these
rectangular areas the color varies instead of each rectangle having only
one color.
See also the similar ``CoarseDropout``.
TODO replace dtype support with uint8 only, because replacement is
geared towards that value range
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of changing a pixel to salt/pepper noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a lower-resolution mask will
be sampled from that parameter per image. Any value ``>0.5`` in
that mask will denote a spatial location that is to be replaced
by salt and pepper noise.
size_px : int or tuple of int or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask in absolute pixel dimensions.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_percent` must be set.
* If an integer, then that size will always be used for both height
and width. E.g. a value of ``3`` would lead to a ``3x3`` mask,
which is then upsampled to ``HxW``, where ``H`` is the image size
and ``W`` the image width.
* If a tuple ``(a, b)``, then two values ``M``, ``N`` will be
sampled from the discrete interval ``[a..b]``. The mask
will then be generated at size ``MxN`` and upsampled to ``HxW``.
* If a ``StochasticParameter``, then this parameter will be used to
determine the sizes. It is expected to be discrete.
size_percent : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask *in percent* of the input image.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_px` must be set.
* If a float, then that value will always be used as the percentage
of the height and width (relative to the original size). E.g. for
value ``p``, the mask will be sampled from ``(p*H)x(p*W)`` and
later upsampled to ``HxW``.
* If a tuple ``(a, b)``, then two values ``m``, ``n`` will be
sampled from the interval ``(a, b)`` and used as the size
fractions, i.e the mask size will be ``(m*H)x(n*W)``.
* If a ``StochasticParameter``, then this parameter will be used to
sample the percentage values. It is expected to be continuous.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
min_size : int, optional
Minimum height and width of the low resolution mask. If
`size_percent` or `size_px` leads to a lower value than this,
`min_size` will be used instead. This should never have a value of
less than ``2``, otherwise one may end up with a ``1x1`` low resolution
mask, leading easily to the whole image being replaced.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.CoarseSaltAndPepper(0.05, size_percent=(0.01, 0.1))
Marks ``5%`` of all pixels in a mask to be replaced by salt/pepper
noise. The mask has ``1%`` to ``10%`` the size of the input image.
The mask is then upscaled to the input image size, leading to large
rectangular areas being marked as to be replaced. These areas are then
replaced in the input image by salt/pepper noise.
>>> aug = iaa.CoarseSaltAndPepper(0.05, size_px=(4, 16))
Same as in the previous example, but the replacement mask before upscaling
has a size between ``4x4`` and ``16x16`` pixels (the axis sizes are sampled
independently, i.e. the mask may be rectangular).
>>> aug = iaa.CoarseSaltAndPepper(
>>> 0.05, size_percent=(0.01, 0.1), per_channel=True)
Same as in the first example, but mask and replacement are each sampled
independently per image channel.
"""
def __init__(self, p=(0.02, 0.1), size_px=None, size_percent=None,
per_channel=False, min_size=3,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
mask = iap.handle_probability_param(
p, "p", tuple_to_uniform=True, list_to_choice=True)
if size_px is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=size_px, min_size=min_size)
elif size_percent is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_percent=size_percent, min_size=min_size)
else:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=(3, 8), min_size=min_size)
replacement = iap.Beta(0.5, 0.5) * 255
super(CoarseSaltAndPepper, self).__init__(
mask=mask_low,
replacement=replacement,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class Salt(ReplaceElementwise):
"""
Replace pixels in images with salt noise, i.e. white-ish pixels.
This augmenter is similar to ``SaltAndPepper``, but adds no pepper noise to
images.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of replacing a pixel with salt noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a image-sized mask will be
sampled from that parameter per image. Any value ``>0.5`` in
that mask will be replaced with salt noise.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Salt(0.05)
Replace ``5%`` of all pixels with salt noise (white-ish colors).
"""
def __init__(self, p=(0.0, 0.03), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
replacement01 = iap.ForceSign(
iap.Beta(0.5, 0.5) - 0.5,
positive=True,
mode="invert"
) + 0.5
# FIXME max replacement seems to essentially never exceed 254
replacement = replacement01 * 255
super(Salt, self).__init__(
mask=p,
replacement=replacement,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class CoarseSalt(ReplaceElementwise):
"""
Replace rectangular areas in images with white-ish pixel noise.
See also the similar ``CoarseSaltAndPepper``.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of changing a pixel to salt noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a lower-resolution mask will
be sampled from that parameter per image. Any value ``>0.5`` in
that mask will denote a spatial location that is to be replaced
by salt noise.
size_px : int or tuple of int or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask in absolute pixel dimensions.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_percent` must be set.
* If an integer, then that size will always be used for both height
and width. E.g. a value of ``3`` would lead to a ``3x3`` mask,
which is then upsampled to ``HxW``, where ``H`` is the image size
and ``W`` the image width.
* If a tuple ``(a, b)``, then two values ``M``, ``N`` will be
sampled from the discrete interval ``[a..b]``. The mask
will then be generated at size ``MxN`` and upsampled to ``HxW``.
* If a ``StochasticParameter``, then this parameter will be used to
determine the sizes. It is expected to be discrete.
size_percent : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask *in percent* of the input image.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_px` must be set.
* If a float, then that value will always be used as the percentage
of the height and width (relative to the original size). E.g. for
value ``p``, the mask will be sampled from ``(p*H)x(p*W)`` and
later upsampled to ``HxW``.
* If a tuple ``(a, b)``, then two values ``m``, ``n`` will be
sampled from the interval ``(a, b)`` and used as the size
fractions, i.e the mask size will be ``(m*H)x(n*W)``.
* If a ``StochasticParameter``, then this parameter will be used to
sample the percentage values. It is expected to be continuous.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
min_size : int, optional
Minimum height and width of the low resolution mask. If
`size_percent` or `size_px` leads to a lower value than this,
`min_size` will be used instead. This should never have a value of
less than ``2``, otherwise one may end up with a ``1x1`` low resolution
mask, leading easily to the whole image being replaced.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.CoarseSalt(0.05, size_percent=(0.01, 0.1))
Mark ``5%`` of all pixels in a mask to be replaced by salt
noise. The mask has ``1%`` to ``10%`` the size of the input image.
The mask is then upscaled to the input image size, leading to large
rectangular areas being marked as to be replaced. These areas are then
replaced in the input image by salt noise.
"""
def __init__(self, p=(0.02, 0.1), size_px=None, size_percent=None,
per_channel=False, min_size=3,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
mask = iap.handle_probability_param(
p, "p", tuple_to_uniform=True, list_to_choice=True)
if size_px is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=size_px, min_size=min_size)
elif size_percent is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_percent=size_percent, min_size=min_size)
else:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=(3, 8), min_size=min_size)
replacement01 = iap.ForceSign(
iap.Beta(0.5, 0.5) - 0.5,
positive=True,
mode="invert"
) + 0.5
replacement = replacement01 * 255
super(CoarseSalt, self).__init__(
mask=mask_low,
replacement=replacement,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class Pepper(ReplaceElementwise):
"""
Replace pixels in images with pepper noise, i.e. black-ish pixels.
This augmenter is similar to ``SaltAndPepper``, but adds no salt noise to
images.
This augmenter is similar to ``Dropout``, but slower and the black pixels
are not uniformly black.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of replacing a pixel with pepper noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a image-sized mask will be
sampled from that parameter per image. Any value ``>0.5`` in
that mask will be replaced with pepper noise.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Pepper(0.05)
Replace ``5%`` of all pixels with pepper noise (black-ish colors).
"""
def __init__(self, p=(0.0, 0.05), per_channel=False,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
replacement01 = iap.ForceSign(
iap.Beta(0.5, 0.5) - 0.5,
positive=False,
mode="invert"
) + 0.5
replacement = replacement01 * 255
super(Pepper, self).__init__(
mask=p,
replacement=replacement,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class CoarsePepper(ReplaceElementwise):
"""
Replace rectangular areas in images with black-ish pixel noise.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.ReplaceElementwise`.
Parameters
----------
p : float or tuple of float or list of float or imgaug.parameters.StochasticParameter, optional
Probability of changing a pixel to pepper noise.
* If a float, then that value will always be used as the
probability.
* If a tuple ``(a, b)``, then a probability will be sampled
uniformly per image from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image.
* If a ``StochasticParameter``, then a lower-resolution mask will
be sampled from that parameter per image. Any value ``>0.5`` in
that mask will denote a spatial location that is to be replaced
by pepper noise.
size_px : int or tuple of int or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask in absolute pixel dimensions.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_percent` must be set.
* If an integer, then that size will always be used for both height
and width. E.g. a value of ``3`` would lead to a ``3x3`` mask,
which is then upsampled to ``HxW``, where ``H`` is the image size
and ``W`` the image width.
* If a tuple ``(a, b)``, then two values ``M``, ``N`` will be
sampled from the discrete interval ``[a..b]``. The mask
will then be generated at size ``MxN`` and upsampled to ``HxW``.
* If a ``StochasticParameter``, then this parameter will be used to
determine the sizes. It is expected to be discrete.
size_percent : float or tuple of float or imgaug.parameters.StochasticParameter, optional
The size of the lower resolution image from which to sample the
replacement mask *in percent* of the input image.
Note that this means that *lower* values of this parameter lead to
*larger* areas being replaced (as any pixel in the lower resolution
image will correspond to a larger area at the original resolution).
* If ``None`` then `size_px` must be set.
* If a float, then that value will always be used as the percentage
of the height and width (relative to the original size). E.g. for
value ``p``, the mask will be sampled from ``(p*H)x(p*W)`` and
later upsampled to ``HxW``.
* If a tuple ``(a, b)``, then two values ``m``, ``n`` will be
sampled from the interval ``(a, b)`` and used as the size
fractions, i.e the mask size will be ``(m*H)x(n*W)``.
* If a ``StochasticParameter``, then this parameter will be used to
sample the percentage values. It is expected to be continuous.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
min_size : int, optional
Minimum size of the low resolution mask, both width and height. If
`size_percent` or `size_px` leads to a lower value than this, `min_size`
will be used instead. This should never have a value of less than 2,
otherwise one may end up with a ``1x1`` low resolution mask, leading
easily to the whole image being replaced.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.CoarsePepper(0.05, size_percent=(0.01, 0.1))
Mark ``5%`` of all pixels in a mask to be replaced by pepper
noise. The mask has ``1%`` to ``10%`` the size of the input image.
The mask is then upscaled to the input image size, leading to large
rectangular areas being marked as to be replaced. These areas are then
replaced in the input image by pepper noise.
"""
def __init__(self, p=(0.02, 0.1), size_px=None, size_percent=None,
per_channel=False, min_size=3,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
mask = iap.handle_probability_param(
p, "p", tuple_to_uniform=True, list_to_choice=True)
if size_px is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=size_px, min_size=min_size)
elif size_percent is not None:
mask_low = iap.FromLowerResolution(
other_param=mask, size_percent=size_percent, min_size=min_size)
else:
mask_low = iap.FromLowerResolution(
other_param=mask, size_px=(3, 8), min_size=min_size)
replacement01 = iap.ForceSign(
iap.Beta(0.5, 0.5) - 0.5,
positive=False,
mode="invert"
) + 0.5
replacement = replacement01 * 255
super(CoarsePepper, self).__init__(
mask=mask_low,
replacement=replacement,
per_channel=per_channel,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
[docs]class Invert(meta.Augmenter):
"""
Invert all values in images, e.g. turn ``5`` into ``255-5=250``.
For the standard value range of 0-255 it converts ``0`` to ``255``,
``255`` to ``0`` and ``10`` to ``(255-10)=245``.
Let ``M`` be the maximum value possible, ``m`` the minimum value possible,
``v`` a value. Then the distance of ``v`` to ``m`` is ``d=abs(v-m)`` and
the new value is given by ``v'=M-d``.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.invert_`.
Parameters
----------
p : float or imgaug.parameters.StochasticParameter, optional
The probability of an image to be inverted.
* If a float, then that probability will be used for all images,
i.e. `p` percent of all images will be inverted.
* If a ``StochasticParameter``, then that parameter will be queried
per image and is expected to return values in the interval
``[0.0, 1.0]``, where values ``>0.5`` mean that the image
is supposed to be inverted. Recommended to be some form of
``imgaug.parameters.Binomial``.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
min_value : None or number, optional
Minimum of the value range of input images, e.g. ``0`` for ``uint8``
images. If set to ``None``, the value will be automatically derived
from the image's dtype.
max_value : None or number, optional
Maximum of the value range of input images, e.g. ``255`` for ``uint8``
images. If set to ``None``, the value will be automatically derived
from the image's dtype.
threshold : None or number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
A threshold to use in order to invert only numbers above or below
the threshold. If ``None`` no thresholding will be used.
* If ``None``: No thresholding will be used.
* If ``number``: The value will be used for all images.
* If ``tuple`` ``(a, b)``: A value will be uniformly sampled per
image from the interval ``[a, b)``.
* If ``list``: A random value will be picked from the list per
image.
* If ``StochasticParameter``: Per batch of size ``N``, the
parameter will be queried once to return ``(N,)`` samples.
invert_above_threshold : bool or float or imgaug.parameters.StochasticParameter, optional
If ``True``, only values ``>=threshold`` will be inverted.
Otherwise, only values ``<threshold`` will be inverted.
If a ``number``, then expected to be in the interval ``[0.0, 1.0]`` and
denoting an imagewise probability. If a ``StochasticParameter`` then
``(N,)`` values will be sampled from the parameter per batch of size
``N`` and interpreted as ``True`` if ``>0.5``.
If `threshold` is ``None`` this parameter has no effect.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Invert(0.1)
Inverts the colors in ``10`` percent of all images.
>>> aug = iaa.Invert(0.1, per_channel=True)
Inverts the colors in ``10`` percent of all image channels. This may or
may not lead to multiple channels in an image being inverted.
>>> aug = iaa.Invert(0.1, per_channel=0.5)
Identical to the previous example, but the `per_channel` feature is only
active for 50 percent of all images.
"""
# when no custom min/max are chosen, all bool, uint, int and float dtypes
# should be invertable (float tested only up to 64bit)
# when chosing custom min/max:
# - bool makes no sense, not allowed
# - int and float must be increased in resolution if custom min/max values
# are chosen, hence they are limited to 32 bit and below
# - uint64 is converted by numpy's clip to float64, hence loss of accuracy
# - float16 seems to not be perfectly accurate, but still ok-ish -- was
# off by 10 for center value of range (float 16 min, 16), where float
# 16 min is around -65500
ALLOW_DTYPES_CUSTOM_MINMAX = [
np.dtype(dt) for dt in [
np.uint8, np.uint16, np.uint32,
np.int8, np.int16, np.int32,
np.float16, np.float32
]
]
def __init__(self, p=1, per_channel=False, min_value=None, max_value=None,
threshold=None, invert_above_threshold=0.5,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(Invert, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# TODO allow list and tuple for p
self.p = iap.handle_probability_param(p, "p")
self.per_channel = iap.handle_probability_param(per_channel,
"per_channel")
self.min_value = min_value
self.max_value = max_value
if threshold is None:
self.threshold = None
else:
self.threshold = iap.handle_continuous_param(
threshold, "threshold", value_range=None, tuple_to_uniform=True,
list_to_choice=True)
self.invert_above_threshold = iap.handle_probability_param(
invert_above_threshold, "invert_above_threshold")
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
samples = self._draw_samples(batch, random_state)
for i, image in enumerate(batch.images):
if 0 in image.shape:
continue
kwargs = {
"min_value": samples.min_value[i],
"max_value": samples.max_value[i],
"threshold": samples.threshold[i],
"invert_above_threshold": samples.invert_above_threshold[i]
}
if samples.per_channel[i]:
nb_channels = image.shape[2]
mask = samples.p[i, :nb_channels]
image[..., mask] = invert_(image[..., mask], **kwargs)
else:
if samples.p[i, 0]:
image[:, :, :] = invert_(image, **kwargs)
return batch
# Added in 0.4.0.
def _draw_samples(self, batch, random_state):
nb_images = batch.nb_rows
nb_channels = meta.estimate_max_number_of_channels(batch.images)
p = self.p.draw_samples((nb_images, nb_channels),
random_state=random_state)
p = (p > 0.5)
per_channel = self.per_channel.draw_samples((nb_images,),
random_state=random_state)
per_channel = (per_channel > 0.5)
min_value = [self.min_value] * nb_images
max_value = [self.max_value] * nb_images
if self.threshold is None:
threshold = [None] * nb_images
else:
threshold = self.threshold.draw_samples(
(nb_images,), random_state=random_state)
invert_above_threshold = self.invert_above_threshold.draw_samples(
(nb_images,), random_state=random_state)
invert_above_threshold = (invert_above_threshold > 0.5)
return _InvertSamples(
p=p,
per_channel=per_channel,
min_value=min_value,
max_value=max_value,
threshold=threshold,
invert_above_threshold=invert_above_threshold
)
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.p, self.per_channel, self.min_value, self.max_value,
self.threshold, self.invert_above_threshold]
# Added in 0.4.0.
class _InvertSamples(object):
# Added in 0.4.0.
def __init__(self, p, per_channel, min_value, max_value,
threshold, invert_above_threshold):
self.p = p
self.per_channel = per_channel
self.min_value = min_value
self.max_value = max_value
self.threshold = threshold
self.invert_above_threshold = invert_above_threshold
[docs]class Solarize(Invert):
"""Invert all pixel values above a threshold.
This is the same as :class:`Invert`, but sets a default threshold around
``128`` (+/- 64, decided per image) and default `invert_above_threshold`
to ``True`` (i.e. only values above the threshold will be inverted).
See :class:`Invert` for more details.
Added in 0.4.0.
**Supported dtypes**:
See :class:`~imgaug.augmenters.arithmetic.Invert`.
Parameters
----------
p : float or imgaug.parameters.StochasticParameter
See :class:`Invert`.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
See :class:`Invert`.
min_value : None or number, optional
See :class:`Invert`.
max_value : None or number, optional
See :class:`Invert`.
threshold : None or number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
See :class:`Invert`.
invert_above_threshold : bool or float or imgaug.parameters.StochasticParameter, optional
See :class:`Invert`.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.Solarize(0.5, threshold=(32, 128))
Invert the colors in ``50`` percent of all images for pixels with a
value between ``32`` and ``128`` or more. The threshold is sampled once
per image. The thresholding operation happens per channel.
"""
def __init__(self, p=1, per_channel=False, min_value=None, max_value=None,
threshold=(128-64, 128+64), invert_above_threshold=True,
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(Solarize, self).__init__(
p=p, per_channel=per_channel,
min_value=min_value, max_value=max_value,
threshold=threshold, invert_above_threshold=invert_above_threshold,
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# TODO remove from examples
[docs]@ia.deprecated("imgaug.contrast.LinearContrast")
def ContrastNormalization(alpha=1.0, per_channel=False,
seed=None, name=None,
random_state="deprecated",
deterministic="deprecated"):
"""
Change the contrast of images.
dtype support:
See ``imgaug.augmenters.contrast.LinearContrast``.
Deprecated since 0.3.0.
Parameters
----------
alpha : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Strength of the contrast normalization. Higher values than 1.0
lead to higher contrast, lower values decrease the contrast.
* If a number, then that value will be used for all images.
* If a tuple ``(a, b)``, then a value will be sampled per image
uniformly from the interval ``[a, b]`` and be used as the alpha
value.
* If a list, then a random value will be picked per image from
that list.
* If a ``StochasticParameter``, then this parameter will be used to
sample the alpha value per image.
per_channel : bool or float or imgaug.parameters.StochasticParameter, optional
Whether to use (imagewise) the same sample(s) for all
channels (``False``) or to sample value(s) for each channel (``True``).
Setting this to ``True`` will therefore lead to different
transformations per image *and* channel, otherwise only per image.
If this value is a float ``p``, then for ``p`` percent of all images
`per_channel` will be treated as ``True``.
If it is a ``StochasticParameter`` it is expected to produce samples
with values between ``0.0`` and ``1.0``, where values ``>0.5`` will
lead to per-channel behaviour (i.e. same as ``True``).
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> iaa.ContrastNormalization((0.5, 1.5))
Decreases oder improves contrast per image by a random factor between
``0.5`` and ``1.5``. The factor ``0.5`` means that any difference from
the center value (i.e. 128) will be halved, leading to less contrast.
>>> iaa.ContrastNormalization((0.5, 1.5), per_channel=0.5)
Same as before, but for 50 percent of all images the normalization is done
independently per channel (i.e. factors can vary per channel for the same
image). In the other 50 percent of all images, the factor is the same for
all channels.
"""
# pylint: disable=invalid-name
# placed here to avoid cyclic dependency
from . import contrast as contrast_lib
return contrast_lib.LinearContrast(
alpha=alpha, per_channel=per_channel,
seed=seed, name=name, random_state=random_state, deterministic=deterministic)
# TODO try adding per channel somehow
[docs]class JpegCompression(meta.Augmenter):
"""
Degrade the quality of images by JPEG-compressing them.
During JPEG compression, high frequency components (e.g. edges) are removed.
With low compression (strength) only the highest frequency components are
removed, while very high compression (strength) will lead to only the
lowest frequency components "surviving". This lowers the image quality.
For more details, see https://en.wikipedia.org/wiki/Compression_artifact.
Note that this augmenter still returns images as numpy arrays (i.e. saves
the images with JPEG compression and then reloads them into arrays). It
does not return the raw JPEG file content.
**Supported dtypes**:
See :func:`~imgaug.augmenters.arithmetic.compress_jpeg`.
Parameters
----------
compression : number or tuple of number or list of number or imgaug.parameters.StochasticParameter, optional
Degree of compression used during JPEG compression within value range
``[0, 100]``. Higher values denote stronger compression and will cause
low-frequency components to disappear. Note that JPEG's compression
strength is also often set as a *quality*, which is the inverse of this
parameter. Common choices for the *quality* setting are around 80 to 95,
depending on the image. This translates here to a *compression*
parameter of around 20 to 5.
* If a single number, then that value always will be used as the
compression.
* If a tuple ``(a, b)``, then the compression will be
a value sampled uniformly from the interval ``[a, b]``.
* If a list, then a random value will be sampled from that list
per image and used as the compression.
* If a ``StochasticParameter``, then ``N`` samples will be drawn
from that parameter per ``N`` input images, each representing the
compression for the ``n``-th image.
seed : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
name : None or str, optional
See :func:`~imgaug.augmenters.meta.Augmenter.__init__`.
random_state : None or int or imgaug.random.RNG or numpy.random.Generator or numpy.random.BitGenerator or numpy.random.SeedSequence or numpy.random.RandomState, optional
Old name for parameter `seed`.
Its usage will not yet cause a deprecation warning,
but it is still recommended to use `seed` now.
Outdated since 0.4.0.
deterministic : bool, optional
Deprecated since 0.4.0.
See method ``to_deterministic()`` for an alternative and for
details about what the "deterministic mode" actually does.
Examples
--------
>>> import imgaug.augmenters as iaa
>>> aug = iaa.JpegCompression(compression=(70, 99))
Remove high frequency components in images via JPEG compression with
a *compression strength* between ``70`` and ``99`` (randomly and
uniformly sampled per image). This corresponds to a (very low) *quality*
setting of ``1`` to ``30``.
"""
def __init__(self, compression=(0, 100),
seed=None, name=None,
random_state="deprecated", deterministic="deprecated"):
super(JpegCompression, self).__init__(
seed=seed, name=name,
random_state=random_state, deterministic=deterministic)
# will be converted to int during augmentation, which is why we allow
# floats here
self.compression = iap.handle_continuous_param(
compression, "compression",
value_range=(0, 100), tuple_to_uniform=True, list_to_choice=True)
# Added in 0.4.0.
def _augment_batch_(self, batch, random_state, parents, hooks):
if batch.images is None:
return batch
images = batch.images
nb_images = len(images)
samples = self.compression.draw_samples((nb_images,),
random_state=random_state)
for i, (image, sample) in enumerate(zip(images, samples)):
batch.images[i] = compress_jpeg(image, int(sample))
return batch
[docs] def get_parameters(self):
"""See :func:`~imgaug.augmenters.meta.Augmenter.get_parameters`."""
return [self.compression]