Blur transforms (augmentations.blur.transforms)¶
class AdvancedBlur
(blur_limit=(3, 7), sigma_x_limit=(0.2, 1.0), sigma_y_limit=(0.2, 1.0), sigmaX_limit=None, sigmaY_limit=None, rotate_limit=90, beta_limit=(0.5, 8.0), noise_limit=(0.9, 1.1), always_apply=False, p=0.5)
[view source on GitHub] ¶
Blurs the input image using a Generalized Normal filter with randomly selected parameters.
This transform also adds multiplicative noise to the generated kernel before convolution, affecting the image in a unique way that combines blurring and noise injection for enhanced data augmentation.
Parameters:
Name | Type | Description |
---|---|---|
blur_limit | ScaleIntType | Maximum Gaussian kernel size for blurring the input image. Must be zero or odd and in range [0, inf). If set to 0, it will be computed from sigma as |
sigma_x_limit | ScaleFloatType | Gaussian kernel standard deviation for the X dimension. Must be in range [0, inf). If a single value is provided, |
sigma_y_limit | ScaleFloatType | Gaussian kernel standard deviation for the Y dimension. Must follow the same rules as |
rotate_limit | ScaleIntType | Range from which a random angle used to rotate the Gaussian kernel is picked. If limit is a single int, an angle is picked from (-rotate_limit, rotate_limit). Defaults to (-90, 90). |
beta_limit | ScaleFloatType | Distribution shape parameter. 1 represents the normal distribution. Values below 1.0 make distribution tails heavier than normal, and values above 1.0 make it lighter than normal. Defaults to (0.5, 8.0). |
noise_limit | ScaleFloatType | Multiplicative factor that controls the strength of kernel noise. Must be positive and preferably centered around 1.0. If a single value is provided, |
p | float | Probability of applying the transform. Defaults to 0.5. |
Reference
"Real-ESRGAN: Training Real-World Blind Super-Resolution with Pure Synthetic Data", available at https://arxiv.org/abs/2107.10833
Targets
image
Image types: uint8, float32
Source code in albumentations/augmentations/blur/transforms.py
class AdvancedBlur(ImageOnlyTransform):
"""Blurs the input image using a Generalized Normal filter with randomly selected parameters.
This transform also adds multiplicative noise to the generated kernel before convolution,
affecting the image in a unique way that combines blurring and noise injection for enhanced
data augmentation.
Args:
blur_limit (ScaleIntType, optional): Maximum Gaussian kernel size for blurring the input image.
Must be zero or odd and in range [0, inf). If set to 0, it will be computed from sigma
as `round(sigma * (3 if img.dtype == np.uint8 else 4) * 2 + 1) + 1`.
If a single value is provided, `blur_limit` will be in the range (0, blur_limit).
Defaults to (3, 7).
sigma_x_limit ScaleFloatType: Gaussian kernel standard deviation for the X dimension.
Must be in range [0, inf). If a single value is provided, `sigma_x_limit` will be in the range
(0, sigma_limit). If set to 0, sigma will be computed as `sigma = 0.3*((ksize-1)*0.5 - 1) + 0.8`.
Defaults to (0.2, 1.0).
sigma_y_limit ScaleFloatType: Gaussian kernel standard deviation for the Y dimension.
Must follow the same rules as `sigma_x_limit`.
Defaults to (0.2, 1.0).
rotate_limit (ScaleIntType, optional): Range from which a random angle used to rotate the Gaussian kernel
is picked. If limit is a single int, an angle is picked from (-rotate_limit, rotate_limit).
Defaults to (-90, 90).
beta_limit (ScaleFloatType, optional): Distribution shape parameter. 1 represents the normal distribution.
Values below 1.0 make distribution tails heavier than normal, and values above 1.0 make it
lighter than normal.
Defaults to (0.5, 8.0).
noise_limit (ScaleFloatType, optional): Multiplicative factor that controls the strength of kernel noise.
Must be positive and preferably centered around 1.0. If a single value is provided,
`noise_limit` will be in the range (0, noise_limit).
Defaults to (0.75, 1.25).
p (float, optional): Probability of applying the transform.
Defaults to 0.5.
Reference:
"Real-ESRGAN: Training Real-World Blind Super-Resolution with Pure Synthetic Data",
available at https://arxiv.org/abs/2107.10833
Targets:
image
Image types:
uint8, float32
"""
class InitSchema(BlurInitSchema):
sigma_x_limit: NonNegativeFloatRangeType = (0.2, 1.0)
sigma_y_limit: NonNegativeFloatRangeType = (0.2, 1.0)
beta_limit: NonNegativeFloatRangeType = (0.5, 8.0)
noise_limit: NonNegativeFloatRangeType = (0.75, 1.25)
rotate_limit: SymmetricRangeType = (-90, 90)
@field_validator("beta_limit")
@classmethod
def check_beta_limit(cls, value: ScaleFloatType) -> Tuple[float, float]:
result = to_tuple(value, low=0)
if not (result[0] < 1.0 < result[1]):
msg = "beta_limit is expected to include 1.0."
raise ValueError(msg)
return result
@model_validator(mode="after")
def validate_limits(self) -> Self:
if (
isinstance(self.sigma_x_limit, (tuple, list))
and self.sigma_x_limit[0] == 0
and isinstance(self.sigma_y_limit, (tuple, list))
and self.sigma_y_limit[0] == 0
):
msg = "sigma_x_limit and sigma_y_limit minimum value cannot be both equal to 0."
raise ValueError(msg)
return self
def __init__(
self,
blur_limit: ScaleIntType = (3, 7),
sigma_x_limit: ScaleFloatType = (0.2, 1.0),
sigma_y_limit: ScaleFloatType = (0.2, 1.0),
sigmaX_limit: Optional[ScaleFloatType] = None, # noqa: N803
sigmaY_limit: Optional[ScaleFloatType] = None, # noqa: N803
rotate_limit: ScaleIntType = 90,
beta_limit: ScaleFloatType = (0.5, 8.0),
noise_limit: ScaleFloatType = (0.9, 1.1),
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(always_apply, p)
if sigmaX_limit is not None:
warnings.warn("sigmaX_limit is deprecated; use sigma_x_limit instead.", DeprecationWarning)
sigma_x_limit = sigmaX_limit
if sigmaY_limit is not None:
warnings.warn("sigmaY_limit is deprecated; use sigma_y_limit instead.", DeprecationWarning)
sigma_y_limit = sigmaY_limit
self.blur_limit = cast(Tuple[int, int], blur_limit)
self.sigma_x_limit = cast(Tuple[float, float], sigma_x_limit)
self.sigma_y_limit = cast(Tuple[float, float], sigma_y_limit)
self.rotate_limit = cast(Tuple[int, int], rotate_limit)
self.beta_limit = cast(Tuple[float, float], beta_limit)
self.noise_limit = cast(Tuple[float, float], noise_limit)
def apply(self, img: np.ndarray, kernel: Optional[np.ndarray] = None, **params: Any) -> np.ndarray:
return FMain.convolve(img, kernel=kernel)
def get_params(self) -> Dict[str, np.ndarray]:
ksize = random.randrange(self.blur_limit[0], self.blur_limit[1] + 1, 2)
sigma_x = random_utils.uniform(*self.sigma_x_limit)
sigma_y = random_utils.uniform(*self.sigma_y_limit)
angle = np.deg2rad(random.uniform(*self.rotate_limit))
# Split into 2 cases to avoid selection of narrow kernels (beta > 1) too often.
beta = (
random.uniform(self.beta_limit[0], 1) if random.random() < HALF else random.uniform(1, self.beta_limit[1])
)
noise_matrix = random_utils.uniform(self.noise_limit[0], self.noise_limit[1], size=[ksize, ksize])
# Generate mesh grid centered at zero.
ax = np.arange(-ksize // 2 + 1.0, ksize // 2 + 1.0)
# > Shape (ksize, ksize, 2)
grid = np.stack(np.meshgrid(ax, ax), axis=-1)
# Calculate rotated sigma matrix
d_matrix = np.array([[sigma_x**2, 0], [0, sigma_y**2]])
u_matrix = np.array([[np.cos(angle), -np.sin(angle)], [np.sin(angle), np.cos(angle)]])
sigma_matrix = np.dot(u_matrix, np.dot(d_matrix, u_matrix.T))
inverse_sigma = np.linalg.inv(sigma_matrix)
# Described in "Parameter Estimation For Multivariate Generalized Gaussian Distributions"
kernel = np.exp(-0.5 * np.power(np.sum(np.dot(grid, inverse_sigma) * grid, 2), beta))
# Add noise
kernel *= noise_matrix
# Normalize kernel
kernel = kernel.astype(np.float32) / np.sum(kernel)
return {"kernel": kernel}
def get_transform_init_args_names(self) -> Tuple[str, str, str, str, str, str]:
return (
"blur_limit",
"sigma_x_limit",
"sigma_y_limit",
"rotate_limit",
"beta_limit",
"noise_limit",
)
apply (self, img, kernel=None, **params)
¶
get_params (self)
¶
Returns parameters independent of input
Source code in albumentations/augmentations/blur/transforms.py
def get_params(self) -> Dict[str, np.ndarray]:
ksize = random.randrange(self.blur_limit[0], self.blur_limit[1] + 1, 2)
sigma_x = random_utils.uniform(*self.sigma_x_limit)
sigma_y = random_utils.uniform(*self.sigma_y_limit)
angle = np.deg2rad(random.uniform(*self.rotate_limit))
# Split into 2 cases to avoid selection of narrow kernels (beta > 1) too often.
beta = (
random.uniform(self.beta_limit[0], 1) if random.random() < HALF else random.uniform(1, self.beta_limit[1])
)
noise_matrix = random_utils.uniform(self.noise_limit[0], self.noise_limit[1], size=[ksize, ksize])
# Generate mesh grid centered at zero.
ax = np.arange(-ksize // 2 + 1.0, ksize // 2 + 1.0)
# > Shape (ksize, ksize, 2)
grid = np.stack(np.meshgrid(ax, ax), axis=-1)
# Calculate rotated sigma matrix
d_matrix = np.array([[sigma_x**2, 0], [0, sigma_y**2]])
u_matrix = np.array([[np.cos(angle), -np.sin(angle)], [np.sin(angle), np.cos(angle)]])
sigma_matrix = np.dot(u_matrix, np.dot(d_matrix, u_matrix.T))
inverse_sigma = np.linalg.inv(sigma_matrix)
# Described in "Parameter Estimation For Multivariate Generalized Gaussian Distributions"
kernel = np.exp(-0.5 * np.power(np.sum(np.dot(grid, inverse_sigma) * grid, 2), beta))
# Add noise
kernel *= noise_matrix
# Normalize kernel
kernel = kernel.astype(np.float32) / np.sum(kernel)
return {"kernel": kernel}
get_transform_init_args_names (self)
¶
Returns names of arguments that are used in init method of the transform
class Blur
(blur_limit=7, always_apply=False, p=0.5)
[view source on GitHub] ¶
Blur the input image using a random-sized kernel.
Parameters:
Name | Type | Description |
---|---|---|
blur_limit | Union[int, Tuple[int, int]] | maximum kernel size for blurring the input image. Should be in range [3, inf). Default: (3, 7). |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: uint8, float32
Source code in albumentations/augmentations/blur/transforms.py
class Blur(ImageOnlyTransform):
"""Blur the input image using a random-sized kernel.
Args:
blur_limit: maximum kernel size for blurring the input image.
Should be in range [3, inf). Default: (3, 7).
p: probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
uint8, float32
"""
class InitSchema(BlurInitSchema):
pass
def __init__(self, blur_limit: ScaleIntType = 7, always_apply: bool = False, p: float = 0.5):
super().__init__(always_apply, p)
self.blur_limit = cast(Tuple[int, int], blur_limit)
def apply(self, img: np.ndarray, kernel: int = 3, **params: Any) -> np.ndarray:
return F.blur(img, kernel)
def get_params(self) -> Dict[str, Any]:
return {"ksize": int(random.choice(list(range(self.blur_limit[0], self.blur_limit[1] + 1, 2))))}
def get_transform_init_args_names(self) -> Tuple[str, ...]:
return ("blur_limit",)
class Defocus
(radius=(3, 10), alias_blur=(0.1, 0.5), always_apply=False, p=0.5)
[view source on GitHub] ¶
Apply defocus transform.
Parameters:
Name | Type | Description |
---|---|---|
radius | int, int) or int | range for radius of defocusing. If limit is a single int, the range will be [1, limit]. Default: (3, 10). |
alias_blur | float, float) or float | range for alias_blur of defocusing (sigma of gaussian blur). If limit is a single float, the range will be (0, limit). Default: (0.1, 0.5). |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: unit8, float32
Reference
Source code in albumentations/augmentations/blur/transforms.py
class Defocus(ImageOnlyTransform):
"""Apply defocus transform.
Args:
radius ((int, int) or int): range for radius of defocusing.
If limit is a single int, the range will be [1, limit]. Default: (3, 10).
alias_blur ((float, float) or float): range for alias_blur of defocusing (sigma of gaussian blur).
If limit is a single float, the range will be (0, limit). Default: (0.1, 0.5).
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
unit8, float32
Reference:
https://arxiv.org/abs/1903.12261
"""
class InitSchema(BaseTransformInitSchema):
radius: OnePlusIntRangeType = (3, 10)
alias_blur: NonNegativeFloatRangeType = (0.1, 0.5)
def __init__(
self,
radius: ScaleIntType = (3, 10),
alias_blur: ScaleFloatType = (0.1, 0.5),
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(always_apply, p)
self.radius = cast(Tuple[int, int], radius)
self.alias_blur = cast(Tuple[float, float], alias_blur)
def apply(self, img: np.ndarray, radius: int = 3, alias_blur: float = 0.5, **params: Any) -> np.ndarray:
return F.defocus(img, radius, alias_blur)
def get_params(self) -> Dict[str, Any]:
return {
"radius": random_utils.randint(self.radius[0], self.radius[1] + 1),
"alias_blur": random_utils.uniform(self.alias_blur[0], self.alias_blur[1]),
}
def get_transform_init_args_names(self) -> Tuple[str, str]:
return ("radius", "alias_blur")
class GaussianBlur
(blur_limit=(3, 7), sigma_limit=0, always_apply=False, p=0.5)
[view source on GitHub] ¶
Blur the input image using a Gaussian filter with a random kernel size.
Parameters:
Name | Type | Description |
---|---|---|
blur_limit | int, (int, int | maximum Gaussian kernel size for blurring the input image. Must be zero or odd and in range [0, inf). If set to 0 it will be computed from sigma as |
sigma_limit | float, (float, float | Gaussian kernel standard deviation. Must be in range [0, inf). If set single value |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: uint8, float32
Source code in albumentations/augmentations/blur/transforms.py
class GaussianBlur(ImageOnlyTransform):
"""Blur the input image using a Gaussian filter with a random kernel size.
Args:
blur_limit (int, (int, int)): maximum Gaussian kernel size for blurring the input image.
Must be zero or odd and in range [0, inf). If set to 0 it will be computed from sigma
as `round(sigma * (3 if img.dtype == np.uint8 else 4) * 2 + 1) + 1`.
If set single value `blur_limit` will be in range (0, blur_limit).
Default: (3, 7).
sigma_limit (float, (float, float)): Gaussian kernel standard deviation. Must be in range [0, inf).
If set single value `sigma_limit` will be in range (0, sigma_limit).
If set to 0 sigma will be computed as `sigma = 0.3*((ksize-1)*0.5 - 1) + 0.8`. Default: 0.
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
uint8, float32
"""
class InitSchema(BlurInitSchema):
sigma_limit: NonNegativeFloatRangeType = 0
@field_validator("blur_limit")
@classmethod
def process_blur(cls, value: ScaleIntType, info: ValidationInfo) -> Tuple[int, int]:
return process_blur_limit(value, info, min_value=0)
@model_validator(mode="after")
def validate_limits(self) -> Self:
if (
isinstance(self.blur_limit, (tuple, list))
and self.blur_limit[0] == 0
and isinstance(self.sigma_limit, (tuple, list))
and self.sigma_limit[0] == 0
):
self.blur_limit = 3, max(3, self.blur_limit[1])
warnings.warn(
"blur_limit and sigma_limit minimum value can not be both equal to 0. "
"blur_limit minimum value changed to 3.",
)
if isinstance(self.blur_limit, tuple):
for v in self.blur_limit:
if v != 0 and v % 2 != 1:
raise ValueError(f"Blur limit must be 0 or odd. Got: {self.blur_limit}")
return self
def __init__(
self,
blur_limit: ScaleIntType = (3, 7),
sigma_limit: ScaleFloatType = 0,
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(always_apply, p)
self.blur_limit = cast(Tuple[int, int], blur_limit)
self.sigma_limit = cast(Tuple[float, float], sigma_limit)
def apply(self, img: np.ndarray, ksize: int = 3, sigma: float = 0, **params: Any) -> np.ndarray:
return F.gaussian_blur(img, ksize, sigma=sigma)
def get_params(self) -> Dict[str, float]:
ksize = random.randrange(self.blur_limit[0], self.blur_limit[1] + 1)
if ksize != 0 and ksize % 2 != 1:
ksize = (ksize + 1) % (self.blur_limit[1] + 1)
return {"ksize": ksize, "sigma": random.uniform(*self.sigma_limit)}
def get_transform_init_args_names(self) -> Tuple[str, str]:
return ("blur_limit", "sigma_limit")
class GlassBlur
(sigma=0.7, max_delta=4, iterations=2, mode='fast', always_apply=False, p=0.5)
[view source on GitHub] ¶
Apply glass noise to the input image.
Parameters:
Name | Type | Description |
---|---|---|
sigma | float | standard deviation for Gaussian kernel. |
max_delta | int | max distance between pixels which are swapped. |
iterations | int | number of repeats. Should be in range [1, inf). Default: (2). |
mode | str | mode of computation: fast or exact. Default: "fast". |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: uint8, float32
Reference
https://arxiv.org/abs/1903.12261 https://github.com/hendrycks/robustness/blob/master/ImageNet-C/create_c/make_imagenet_c.py
Source code in albumentations/augmentations/blur/transforms.py
class GlassBlur(ImageOnlyTransform):
"""Apply glass noise to the input image.
Args:
sigma (float): standard deviation for Gaussian kernel.
max_delta (int): max distance between pixels which are swapped.
iterations (int): number of repeats.
Should be in range [1, inf). Default: (2).
mode (str): mode of computation: fast or exact. Default: "fast".
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
uint8, float32
Reference:
https://arxiv.org/abs/1903.12261
https://github.com/hendrycks/robustness/blob/master/ImageNet-C/create_c/make_imagenet_c.py
"""
class InitSchema(BaseTransformInitSchema):
sigma: float = Field(default=0.7, ge=0, description="Standard deviation for the Gaussian kernel.")
max_delta: int = Field(default=4, ge=1, description="Maximum distance between pixels that are swapped.")
iterations: int = Field(default=2, ge=1, description="Number of times the glass noise effect is applied.")
mode: Literal["fast", "exact"] = "fast"
def __init__(
self,
sigma: float = 0.7,
max_delta: int = 4,
iterations: int = 2,
mode: Literal["fast", "exact"] = "fast",
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(always_apply=always_apply, p=p)
self.sigma = sigma
self.max_delta = max_delta
self.iterations = iterations
self.mode = mode
def apply(self, img: np.ndarray, *args: Any, dxy: np.ndarray = None, **params: Any) -> np.ndarray:
if dxy is None:
msg = "dxy is None"
raise ValueError(msg)
return F.glass_blur(img, self.sigma, self.max_delta, self.iterations, dxy, self.mode)
def get_params_dependent_on_targets(self, params: Dict[str, Any]) -> Dict[str, np.ndarray]:
img = params["image"]
height, width = img.shape[:2]
# generate array containing all necessary values for transformations
width_pixels = height - self.max_delta * 2
height_pixels = width - self.max_delta * 2
total_pixels = int(width_pixels * height_pixels)
dxy = random_utils.randint(-self.max_delta, self.max_delta, size=(total_pixels, self.iterations, 2))
return {"dxy": dxy}
def get_transform_init_args_names(self) -> Tuple[str, str, str, str]:
return ("sigma", "max_delta", "iterations", "mode")
@property
def targets_as_params(self) -> List[str]:
return ["image"]
targets_as_params: List[str]
property
readonly
¶
Targets used to get params
apply (self, img, *args, *, dxy=None, **params)
¶
Apply transform on image.
Source code in albumentations/augmentations/blur/transforms.py
get_params_dependent_on_targets (self, params)
¶
Returns parameters dependent on targets. Dependent target is defined in self.targets_as_params
Source code in albumentations/augmentations/blur/transforms.py
def get_params_dependent_on_targets(self, params: Dict[str, Any]) -> Dict[str, np.ndarray]:
img = params["image"]
height, width = img.shape[:2]
# generate array containing all necessary values for transformations
width_pixels = height - self.max_delta * 2
height_pixels = width - self.max_delta * 2
total_pixels = int(width_pixels * height_pixels)
dxy = random_utils.randint(-self.max_delta, self.max_delta, size=(total_pixels, self.iterations, 2))
return {"dxy": dxy}
get_transform_init_args_names (self)
¶
class MedianBlur
(blur_limit=7, always_apply=False, p=0.5)
[view source on GitHub] ¶
Blur the input image using a median filter with a random aperture linear size.
Parameters:
Name | Type | Description |
---|---|---|
blur_limit | int | maximum aperture linear size for blurring the input image. Must be odd and in range [3, inf). Default: (3, 7). |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: uint8, float32
Source code in albumentations/augmentations/blur/transforms.py
class MedianBlur(Blur):
"""Blur the input image using a median filter with a random aperture linear size.
Args:
blur_limit (int): maximum aperture linear size for blurring the input image.
Must be odd and in range [3, inf). Default: (3, 7).
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
uint8, float32
"""
def __init__(self, blur_limit: ScaleIntType = 7, always_apply: bool = False, p: float = 0.5):
super().__init__(blur_limit, always_apply, p)
def apply(self, img: np.ndarray, kernel: int = 3, **params: Any) -> np.ndarray:
return F.median_blur(img, kernel)
class MotionBlur
(blur_limit=7, allow_shifted=True, always_apply=False, p=0.5)
[view source on GitHub] ¶
Apply motion blur to the input image using a random-sized kernel.
Parameters:
Name | Type | Description |
---|---|---|
blur_limit | int | maximum kernel size for blurring the input image. Should be in range [3, inf). Default: (3, 7). |
allow_shifted | bool | if set to true creates non shifted kernels only, otherwise creates randomly shifted kernels. Default: True. |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: uint8, float32
Source code in albumentations/augmentations/blur/transforms.py
class MotionBlur(Blur):
"""Apply motion blur to the input image using a random-sized kernel.
Args:
blur_limit (int): maximum kernel size for blurring the input image.
Should be in range [3, inf). Default: (3, 7).
allow_shifted (bool): if set to true creates non shifted kernels only,
otherwise creates randomly shifted kernels. Default: True.
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
uint8, float32
"""
class InitSchema(BaseTransformInitSchema):
allow_shifted: bool = Field(
default=True,
description="If set to true creates non-shifted kernels only, otherwise creates randomly shifted kernels.",
)
blur_limit: ScaleIntType = Field(
default=(3, 7),
description="Maximum kernel size for blurring the input image.",
)
@model_validator(mode="after")
def process_blur(self) -> Self:
self.blur_limit = cast(Tuple[int, int], to_tuple(self.blur_limit, 3))
if self.allow_shifted and isinstance(self.blur_limit, tuple) and any(x % 2 != 1 for x in self.blur_limit):
raise ValueError(f"Blur limit must be odd when centered=True. Got: {self.blur_limit}")
return self
def __init__(
self,
blur_limit: ScaleIntType = 7,
allow_shifted: bool = True,
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(blur_limit=blur_limit, always_apply=always_apply, p=p)
self.allow_shifted = allow_shifted
self.blur_limit = cast(Tuple[int, int], blur_limit)
def get_transform_init_args_names(self) -> Tuple[str, ...]:
return (*super().get_transform_init_args_names(), "allow_shifted")
def apply(self, img: np.ndarray, kernel: Optional[np.ndarray] = None, **params: Any) -> np.ndarray:
return FMain.convolve(img, kernel=kernel)
def get_params(self) -> Dict[str, Any]:
ksize = random.choice(list(range(self.blur_limit[0], self.blur_limit[1] + 1, 2)))
if ksize <= TWO:
raise ValueError(f"ksize must be > 2. Got: {ksize}")
kernel = np.zeros((ksize, ksize), dtype=np.uint8)
x1, x2 = random.randint(0, ksize - 1), random.randint(0, ksize - 1)
if x1 == x2:
y1, y2 = random.sample(range(ksize), 2)
else:
y1, y2 = random.randint(0, ksize - 1), random.randint(0, ksize - 1)
def make_odd_val(v1: int, v2: int) -> Tuple[int, int]:
len_v = abs(v1 - v2) + 1
if len_v % 2 != 1:
if v2 > v1:
v2 -= 1
else:
v1 -= 1
return v1, v2
if not self.allow_shifted:
x1, x2 = make_odd_val(x1, x2)
y1, y2 = make_odd_val(y1, y2)
xc = (x1 + x2) / 2
yc = (y1 + y2) / 2
center = ksize / 2 - 0.5
dx = xc - center
dy = yc - center
x1, x2 = (int(i - dx) for i in [x1, x2])
y1, y2 = (int(i - dy) for i in [y1, y2])
cv2.line(kernel, (x1, y1), (x2, y2), 1, thickness=1)
# Normalize kernel
return {"kernel": kernel.astype(np.float32) / np.sum(kernel)}
apply (self, img, kernel=None, **params)
¶
get_params (self)
¶
Returns parameters independent of input
Source code in albumentations/augmentations/blur/transforms.py
def get_params(self) -> Dict[str, Any]:
ksize = random.choice(list(range(self.blur_limit[0], self.blur_limit[1] + 1, 2)))
if ksize <= TWO:
raise ValueError(f"ksize must be > 2. Got: {ksize}")
kernel = np.zeros((ksize, ksize), dtype=np.uint8)
x1, x2 = random.randint(0, ksize - 1), random.randint(0, ksize - 1)
if x1 == x2:
y1, y2 = random.sample(range(ksize), 2)
else:
y1, y2 = random.randint(0, ksize - 1), random.randint(0, ksize - 1)
def make_odd_val(v1: int, v2: int) -> Tuple[int, int]:
len_v = abs(v1 - v2) + 1
if len_v % 2 != 1:
if v2 > v1:
v2 -= 1
else:
v1 -= 1
return v1, v2
if not self.allow_shifted:
x1, x2 = make_odd_val(x1, x2)
y1, y2 = make_odd_val(y1, y2)
xc = (x1 + x2) / 2
yc = (y1 + y2) / 2
center = ksize / 2 - 0.5
dx = xc - center
dy = yc - center
x1, x2 = (int(i - dx) for i in [x1, x2])
y1, y2 = (int(i - dy) for i in [y1, y2])
cv2.line(kernel, (x1, y1), (x2, y2), 1, thickness=1)
# Normalize kernel
return {"kernel": kernel.astype(np.float32) / np.sum(kernel)}
get_transform_init_args_names (self)
¶
class ZoomBlur
(max_factor=(1, 1.31), step_factor=(0.01, 0.03), always_apply=False, p=0.5)
[view source on GitHub] ¶
Apply zoom blur transform.
Parameters:
Name | Type | Description |
---|---|---|
max_factor | float, float) or float | range for max factor for blurring. If max_factor is a single float, the range will be (1, limit). Default: (1, 1.31). All max_factor values should be larger than 1. |
step_factor | float, float) or float | If single float will be used as step parameter for np.arange. If tuple of float step_factor will be in range |
p | float | probability of applying the transform. Default: 0.5. |
Targets
image
Image types: unit8, float32
Reference
Source code in albumentations/augmentations/blur/transforms.py
class ZoomBlur(ImageOnlyTransform):
"""Apply zoom blur transform.
Args:
max_factor ((float, float) or float): range for max factor for blurring.
If max_factor is a single float, the range will be (1, limit). Default: (1, 1.31).
All max_factor values should be larger than 1.
step_factor ((float, float) or float): If single float will be used as step parameter for np.arange.
If tuple of float step_factor will be in range `[step_factor[0], step_factor[1])`. Default: (0.01, 0.03).
All step_factor values should be positive.
p (float): probability of applying the transform. Default: 0.5.
Targets:
image
Image types:
unit8, float32
Reference:
https://arxiv.org/abs/1903.12261
"""
class InitSchema(BaseTransformInitSchema):
max_factor: OnePlusFloatRangeType = (1, 1.31)
step_factor: NonNegativeFloatRangeType = (0.01, 0.03)
def __init__(
self,
max_factor: ScaleFloatType = (1, 1.31),
step_factor: ScaleFloatType = (0.01, 0.03),
always_apply: bool = False,
p: float = 0.5,
):
super().__init__(always_apply, p)
self.max_factor = cast(Tuple[float, float], max_factor)
self.step_factor = cast(Tuple[float, float], step_factor)
def apply(self, img: np.ndarray, zoom_factors: Optional[np.ndarray] = None, **params: Any) -> np.ndarray:
if zoom_factors is None:
msg = "zoom_factors is None"
raise ValueError(msg)
return F.zoom_blur(img, zoom_factors)
def get_params(self) -> Dict[str, Any]:
max_factor = random.uniform(self.max_factor[0], self.max_factor[1])
step_factor = random.uniform(self.step_factor[0], self.step_factor[1])
return {"zoom_factors": np.arange(1.0, max_factor, step_factor)}
def get_transform_init_args_names(self) -> Tuple[str, str]:
return ("max_factor", "step_factor")