Add random_gaussian_blur layer (#20817)

shashaka · web-flow · commit 3e52ce9cd7ca · 2025-01-27T15:04:14.000-08:00
* Add random_gaussian_blur

* Update description and add test cases

* Correct failed test case
diff --git a/keras/api/_tf_keras/keras/layers/__init__.py b/keras/api/_tf_keras/keras/layers/__init__.py
@@ -178,6 +178,9 @@
 from keras.src.layers.preprocessing.image_preprocessing.random_flip import (
     RandomFlip,
 )
+from keras.src.layers.preprocessing.image_preprocessing.random_gaussian_blur import (
+    RandomGaussianBlur,
+)
 from keras.src.layers.preprocessing.image_preprocessing.random_grayscale import (
     RandomGrayscale,
 )
diff --git a/keras/api/layers/__init__.py b/keras/api/layers/__init__.py
@@ -178,6 +178,9 @@
 from keras.src.layers.preprocessing.image_preprocessing.random_flip import (
     RandomFlip,
 )
+from keras.src.layers.preprocessing.image_preprocessing.random_gaussian_blur import (
+    RandomGaussianBlur,
+)
 from keras.src.layers.preprocessing.image_preprocessing.random_grayscale import (
     RandomGrayscale,
 )
diff --git a/keras/src/layers/__init__.py b/keras/src/layers/__init__.py
@@ -122,6 +122,9 @@
 from keras.src.layers.preprocessing.image_preprocessing.random_flip import (
     RandomFlip,
 )
+from keras.src.layers.preprocessing.image_preprocessing.random_gaussian_blur import (
+    RandomGaussianBlur,
+)
 from keras.src.layers.preprocessing.image_preprocessing.random_grayscale import (
     RandomGrayscale,
 )
diff --git a/keras/src/layers/preprocessing/image_preprocessing/random_gaussian_blur.py b/keras/src/layers/preprocessing/image_preprocessing/random_gaussian_blur.py
@@ -0,0 +1,255 @@
+from keras.src.api_export import keras_export
+from keras.src.layers.preprocessing.image_preprocessing.base_image_preprocessing_layer import (  # noqa: E501
+    BaseImagePreprocessingLayer,
+)
+from keras.src.random import SeedGenerator
+
+
+@keras_export("keras.layers.RandomGaussianBlur")
+class RandomGaussianBlur(BaseImagePreprocessingLayer):
+    """Applies random Gaussian blur to images for data augmentation.
+
+    This layer performs a Gaussian blur operation on input images with a
+    randomly selected degree of blurring, controlled by the `factor` and
+    `sigma` arguments.
+
+    Args:
+        factor: A single float or a tuple of two floats.
+            `factor` controls the extent to which the image hue is impacted.
+            `factor=0.0` makes this layer perform a no-op operation,
+            while a value of `1.0` performs the most aggressive
+            blurring available. If a tuple is used, a `factor` is
+            sampled between the two values for every image augmented. If a
+            single float is used, a value between `0.0` and the passed float is
+            sampled. Default is 1.0.
+        kernel_size: Integer. Size of the Gaussian kernel used for blurring.
+            Must be an odd integer. Default is 3.
+        sigma: Float or tuple of two floats. Standard deviation of the Gaussian
+            kernel. Controls the intensity of the blur. If a tuple is provided,
+            a value is sampled between the two for each image. Default is 1.0.
+        value_range: the range of values the incoming images will have.
+            Represented as a two-number tuple written `[low, high]`. This is
+            typically either `[0, 1]` or `[0, 255]` depending on how your
+            preprocessing pipeline is set up.
+        seed: Integer. Used to create a random seed.
+    """
+
+    _USE_BASE_FACTOR = False
+    _FACTOR_BOUNDS = (0, 1)
+
+    def __init__(
+        self,
+        factor=1.0,
+        kernel_size=3,
+        sigma=1.0,
+        value_range=(0, 255),
+        data_format=None,
+        seed=None,
+        **kwargs,
+    ):
+        super().__init__(data_format=data_format, **kwargs)
+        self._set_factor(factor)
+        self.kernel_size = self._set_kernel_size(kernel_size, "kernel_size")
+        self.sigma = self._set_factor_by_name(sigma, "sigma")
+        self.value_range = value_range
+        self.seed = seed
+        self.generator = SeedGenerator(seed)
+
+    def _set_kernel_size(self, factor, name):
+        error_msg = f"{name} must be an odd number. Received: {name}={factor}"
+        if isinstance(factor, (tuple, list)):
+            if len(factor) != 2:
+                error_msg = (
+                    f"The `{name}` argument should be a number "
+                    "(or a list of two numbers) "
+                    f"Received: {name}={factor}"
+                )
+                raise ValueError(error_msg)
+            if (factor[0] % 2 == 0) or (factor[1] % 2 == 0):
+                raise ValueError(error_msg)
+            lower, upper = factor
+        elif isinstance(factor, (int, float)):
+            if factor % 2 == 0:
+                raise ValueError(error_msg)
+            lower, upper = factor, factor
+        else:
+            raise ValueError(error_msg)
+
+        return lower, upper
+
+    def _set_factor_by_name(self, factor, name):
+        error_msg = (
+            f"The `{name}` argument should be a number "
+            "(or a list of two numbers) "
+            "in the range "
+            f"[{self._FACTOR_BOUNDS[0]}, {self._FACTOR_BOUNDS[1]}]. "
+            f"Received: factor={factor}"
+        )
+        if isinstance(factor, (tuple, list)):
+            if len(factor) != 2:
+                raise ValueError(error_msg)
+            if (
+                factor[0] > self._FACTOR_BOUNDS[1]
+                or factor[1] < self._FACTOR_BOUNDS[0]
+            ):
+                raise ValueError(error_msg)
+            lower, upper = sorted(factor)
+        elif isinstance(factor, (int, float)):
+            if (
+                factor < self._FACTOR_BOUNDS[0]
+                or factor > self._FACTOR_BOUNDS[1]
+            ):
+                raise ValueError(error_msg)
+            factor = abs(factor)
+            lower, upper = [max(-factor, self._FACTOR_BOUNDS[0]), factor]
+        else:
+            raise ValueError(error_msg)
+        return lower, upper
+
+    def create_gaussian_kernel(self, kernel_size, sigma, num_channels):
+        def get_gaussian_kernel1d(size, sigma):
+            x = (
+                self.backend.numpy.arange(size, dtype=self.compute_dtype)
+                - (size - 1) / 2
+            )
+            kernel1d = self.backend.numpy.exp(-0.5 * (x / sigma) ** 2)
+            return kernel1d / self.backend.numpy.sum(kernel1d)
+
+        def get_gaussian_kernel2d(size, sigma):
+            kernel1d_x = get_gaussian_kernel1d(size[0], sigma[0])
+            kernel1d_y = get_gaussian_kernel1d(size[1], sigma[1])
+            return self.backend.numpy.tensordot(kernel1d_y, kernel1d_x, axes=0)
+
+        kernel = get_gaussian_kernel2d(kernel_size, sigma)
+
+        kernel = self.backend.numpy.reshape(
+            kernel, (kernel_size[0], kernel_size[1], 1, 1)
+        )
+        kernel = self.backend.numpy.tile(kernel, [1, 1, num_channels, 1])
+
+        kernel = self.backend.cast(kernel, self.compute_dtype)
+
+        return kernel
+
+    def get_random_transformation(self, data, training=True, seed=None):
+        if not training:
+            return None
+
+        if isinstance(data, dict):
+            images = data["images"]
+        else:
+            images = data
+
+        images_shape = self.backend.shape(images)
+        rank = len(images_shape)
+        if rank == 3:
+            batch_size = 1
+        elif rank == 4:
+            batch_size = images_shape[0]
+        else:
+            raise ValueError(
+                "Expected the input image to be rank 3 or 4. Received "
+                f"inputs.shape={images_shape}"
+            )
+
+        seed = seed or self._get_seed_generator(self.backend._backend)
+
+        blur_probability = self.backend.random.uniform(
+            shape=(batch_size,),
+            minval=self.factor[0],
+            maxval=self.factor[1],
+            seed=seed,
+        )
+
+        random_threshold = self.backend.random.uniform(
+            shape=(batch_size,),
+            minval=0.0,
+            maxval=1.0,
+            seed=seed,
+        )
+        should_apply_blur = random_threshold < blur_probability
+
+        blur_factor = (
+            self.backend.random.uniform(
+                shape=(2,),
+                minval=self.sigma[0],
+                maxval=self.sigma[1],
+                seed=seed,
+                dtype=self.compute_dtype,
+            )
+            + 1e-6
+        )
+
+        return {
+            "should_apply_blur": should_apply_blur,
+            "blur_factor": blur_factor,
+        }
+
+    def transform_images(self, images, transformation=None, training=True):
+        images = self.backend.cast(images, self.compute_dtype)
+        if training and transformation is not None:
+            if self.data_format == "channels_first":
+                images = self.backend.numpy.swapaxes(images, -3, -1)
+
+            blur_factor = transformation["blur_factor"]
+            should_apply_blur = transformation["should_apply_blur"]
+
+            kernel = self.create_gaussian_kernel(
+                self.kernel_size,
+                blur_factor,
+                self.backend.shape(images)[-1],
+            )
+
+            blur_images = self.backend.nn.depthwise_conv(
+                images,
+                kernel,
+                strides=1,
+                padding="same",
+                data_format="channels_last",
+            )
+
+            images = self.backend.numpy.where(
+                should_apply_blur[:, None, None, None],
+                blur_images,
+                images,
+            )
+
+            images = self.backend.numpy.clip(
+                images, self.value_range[0], self.value_range[1]
+            )
+
+            if self.data_format == "channels_first":
+                images = self.backend.numpy.swapaxes(images, -3, -1)
+
+            images = self.backend.cast(images, dtype=self.compute_dtype)
+
+        return images
+
+    def transform_labels(self, labels, transformation, training=True):
+        return labels
+
+    def transform_segmentation_masks(
+        self, segmentation_masks, transformation, training=True
+    ):
+        return segmentation_masks
+
+    def transform_bounding_boxes(
+        self, bounding_boxes, transformation, training=True
+    ):
+        return bounding_boxes
+
+    def compute_output_shape(self, input_shape):
+        return input_shape
+
+    def get_config(self):
+        config = super().get_config()
+        config.update(
+            {
+                "factor": self.factor,
+                "kernel_size": self.kernel_size,
+                "sigma": self.sigma,
+                "value_range": self.value_range,
+                "seed": self.seed,
+            }
+        )
+        return config
diff --git a/keras/src/layers/preprocessing/image_preprocessing/random_gaussian_blur_test.py b/keras/src/layers/preprocessing/image_preprocessing/random_gaussian_blur_test.py
@@ -0,0 +1,91 @@
+import numpy as np
+import pytest
+from tensorflow import data as tf_data
+
+from keras.src import backend
+from keras.src import layers
+from keras.src import testing
+from keras.src.backend import convert_to_tensor
+
+
+class RandomGaussianBlurTest(testing.TestCase):
+    @pytest.mark.requires_trainable_backend
+    def test_layer(self):
+        self.run_layer_test(
+            layers.RandomGaussianBlur,
+            init_kwargs={
+                "factor": 1.0,
+                "kernel_size": 3,
+                "sigma": 0,
+                "value_range": (0, 255),
+                "seed": 1,
+            },
+            input_shape=(8, 3, 4, 3),
+            supports_masking=False,
+            expected_output_shape=(8, 3, 4, 3),
+        )
+
+    def test_random_erasing_inference(self):
+        seed = 3481
+        layer = layers.RandomGaussianBlur()
+
+        np.random.seed(seed)
+        inputs = np.random.randint(0, 255, size=(224, 224, 3))
+        output = layer(inputs, training=False)
+        self.assertAllClose(inputs, output)
+
+    def test_random_erasing_no_op(self):
+        seed = 3481
+        layer = layers.RandomGaussianBlur(factor=0)
+
+        np.random.seed(seed)
+        inputs = np.random.randint(0, 255, size=(224, 224, 3))
+        output = layer(inputs)
+        self.assertAllClose(inputs, output)
+
+    def test_random_erasing_basic(self):
+        data_format = backend.config.image_data_format()
+        if data_format == "channels_last":
+            inputs = np.ones((1, 2, 2, 3))
+            expected_output = np.asarray(
+                [
+                    [
+                        [[0.7273, 0.7273, 0.7273], [0.7273, 0.7273, 0.7273]],
+                        [[0.7273, 0.7273, 0.7273], [0.7273, 0.7273, 0.7273]],
+                    ]
+                ]
+            )
+
+        else:
+            inputs = np.ones((1, 3, 2, 2))
+            expected_output = np.asarray(
+                [
+                    [
+                        [[0.7273, 0.7273], [0.7273, 0.7273]],
+                        [[0.7273, 0.7273], [0.7273, 0.7273]],
+                        [[0.7273, 0.7273], [0.7273, 0.7273]],
+                    ]
+                ]
+            )
+
+        layer = layers.RandomGaussianBlur(data_format=data_format)
+
+        transformation = {
+            "blur_factor": convert_to_tensor([0.3732, 0.8654]),
+            "should_apply_blur": convert_to_tensor([True]),
+        }
+        output = layer.transform_images(inputs, transformation)
+
+        self.assertAllClose(expected_output, output, atol=1e-4, rtol=1e-4)
+
+    def test_tf_data_compatibility(self):
+        data_format = backend.config.image_data_format()
+        if data_format == "channels_last":
+            input_data = np.random.random((2, 8, 8, 3))
+        else:
+            input_data = np.random.random((2, 3, 8, 8))
+        layer = layers.RandomGaussianBlur(data_format=data_format)
+
+        ds = tf_data.Dataset.from_tensor_slices(input_data).batch(2).map(layer)
+        for output in ds.take(1):
+            output.numpy()

Original file line number	Diff line number	Diff line change
`@@ -178,6 +178,9 @@`
`178`	`178`	`from keras.src.layers.preprocessing.image_preprocessing.random_flip import (`
`179`	`179`	`RandomFlip,`
`180`	`180`	`)`
	`181`	`+from keras.src.layers.preprocessing.image_preprocessing.random_gaussian_blur import (`
	`182`	`+ RandomGaussianBlur,`
	`183`	`+)`
`181`	`184`	`from keras.src.layers.preprocessing.image_preprocessing.random_grayscale import (`
`182`	`185`	`RandomGrayscale,`
`183`	`186`	`)`
Original file line number	Diff line number	Diff line change
`@@ -122,6 +122,9 @@`
`122`	`122`	`from keras.src.layers.preprocessing.image_preprocessing.random_flip import (`
`123`	`123`	`RandomFlip,`
`124`	`124`	`)`
	`125`	`+from keras.src.layers.preprocessing.image_preprocessing.random_gaussian_blur import (`
	`126`	`+ RandomGaussianBlur,`
	`127`	`+)`
`125`	`128`	`from keras.src.layers.preprocessing.image_preprocessing.random_grayscale import (`
`126`	`129`	`RandomGrayscale,`
`127`	`130`	`)`