Add implementations for mix_up (keras-team#20590)

* Add implementations for mix_up
* Add updated init files
* Applied some corrections
* Remove sample beta method
* Add test cases
* Correct failed test cases
* Correct failed test cases
* Add tf compatibility test case
* Update example in the code
* Fix failed test case
SamanehSaadat · Dec 9, 2024 · 9b1159f · 9b1159f
1 parent 38b9b9c
commit 9b1159f
Show file tree

Hide file tree

Showing 5 changed files with 212 additions and 0 deletions.
diff --git a/keras/api/_tf_keras/keras/layers/__init__.py b/keras/api/_tf_keras/keras/layers/__init__.py
@@ -151,6 +151,7 @@
 from keras.src.layers.preprocessing.image_preprocessing.max_num_bounding_box import (
     MaxNumBoundingBoxes,
 )
+from keras.src.layers.preprocessing.image_preprocessing.mix_up import MixUp
 from keras.src.layers.preprocessing.image_preprocessing.random_brightness import (
     RandomBrightness,
 )

diff --git a/keras/api/layers/__init__.py b/keras/api/layers/__init__.py
@@ -151,6 +151,7 @@
 from keras.src.layers.preprocessing.image_preprocessing.max_num_bounding_box import (
     MaxNumBoundingBoxes,
 )
+from keras.src.layers.preprocessing.image_preprocessing.mix_up import MixUp
 from keras.src.layers.preprocessing.image_preprocessing.random_brightness import (
     RandomBrightness,
 )

diff --git a/keras/src/layers/__init__.py b/keras/src/layers/__init__.py
@@ -94,6 +94,7 @@
 from keras.src.layers.preprocessing.image_preprocessing.max_num_bounding_box import (
     MaxNumBoundingBoxes,
 )
+from keras.src.layers.preprocessing.image_preprocessing.mix_up import MixUp
 from keras.src.layers.preprocessing.image_preprocessing.random_brightness import (
     RandomBrightness,
 )

diff --git a/keras/src/layers/preprocessing/image_preprocessing/mix_up.py b/keras/src/layers/preprocessing/image_preprocessing/mix_up.py
@@ -0,0 +1,146 @@
+import keras.src.random.random
+from keras.src.api_export import keras_export
+from keras.src.layers.preprocessing.image_preprocessing.base_image_preprocessing_layer import (  # noqa: E501
+    BaseImagePreprocessingLayer,
+)
+from keras.src.random import SeedGenerator
+
+
+@keras_export("keras.layers.MixUp")
+class MixUp(BaseImagePreprocessingLayer):
+    """MixUp implements the MixUp data augmentation technique.
+
+    Args:
+        alpha: Float between 0 and 1. Controls the blending strength.
+               Smaller values mean less mixing, while larger values allow
+               for more  blending between images. Defaults to 0.2,
+               recommended for ImageNet1k classification.
+        seed: Integer. Used to create a random seed.
+
+    References:
+        - [MixUp paper](https://arxiv.org/abs/1710.09412).
+        - [MixUp for Object Detection paper](https://arxiv.org/pdf/1902.04103).
+
+    Example:
+    ```python
+    (images, labels), _ = keras.datasets.cifar10.load_data()
+    images, labels = images[:10], labels[:10]
+    # Labels must be floating-point and one-hot encoded
+    labels = tf.cast(tf.one_hot(labels, 10), tf.float32)
+    mixup = keras.layers.MixUp(alpha=0.2)
+    augmented_images, updated_labels = mixup(
+        {'images': images, 'labels': labels}
+    )
+    # output == {'images': updated_images, 'labels': updated_labels}
+    ```
+    """
+
+    def __init__(self, alpha=0.2, data_format=None, seed=None, **kwargs):
+        super().__init__(data_format=None, **kwargs)
+        self.alpha = alpha
+        self.seed = seed
+        self.generator = SeedGenerator(seed)
+
+    def get_random_transformation(self, data, training=True, seed=None):
+        if isinstance(data, dict):
+            images = data["images"]
+        else:
+            images = data
+
+        images_shape = self.backend.shape(images)
+
+        if len(images_shape) == 3:
+            batch_size = 1
+        else:
+            batch_size = self.backend.shape(images)[0]
+
+        permutation_order = self.backend.random.shuffle(
+            self.backend.numpy.arange(0, batch_size, dtype="int64"),
+            seed=self.generator,
+        )
+
+        mix_weight = keras.src.random.random.beta(
+            (1,), self.alpha, self.alpha, seed=self.generator
+        )
+        return {
+            "mix_weight": mix_weight,
+            "permutation_order": permutation_order,
+        }
+
+    def transform_images(self, images, transformation=None, training=True):
+        mix_weight = transformation["mix_weight"]
+        permutation_order = transformation["permutation_order"]
+
+        mix_weight = self.backend.cast(
+            self.backend.numpy.reshape(mix_weight, [-1, 1, 1, 1]),
+            dtype=self.compute_dtype,
+        )
+
+        mixup_images = self.backend.cast(
+            self.backend.numpy.take(images, permutation_order, axis=0),
+            dtype=self.compute_dtype,
+        )
+
+        images = mix_weight * images + (1.0 - mix_weight) * mixup_images
+
+        return images
+
+    def transform_labels(self, labels, transformation, training=True):
+        mix_weight = transformation["mix_weight"]
+        permutation_order = transformation["permutation_order"]
+
+        labels_for_mixup = self.backend.numpy.take(
+            labels, permutation_order, axis=0
+        )
+
+        mix_weight = self.backend.numpy.reshape(mix_weight, [-1, 1])
+
+        labels = mix_weight * labels + (1.0 - mix_weight) * labels_for_mixup
+
+        return labels
+
+    def transform_bounding_boxes(
+        self,
+        bounding_boxes,
+        transformation,
+        training=True,
+    ):
+        permutation_order = transformation["permutation_order"]
+        boxes, classes = bounding_boxes["boxes"], bounding_boxes["classes"]
+        boxes_for_mixup = self.backend.numpy.take(boxes, permutation_order)
+        classes_for_mixup = self.backend.numpy.take(classes, permutation_order)
+        boxes = self.backend.numpy.concat([boxes, boxes_for_mixup], axis=1)
+        classes = self.backend.numpy.concat(
+            [classes, classes_for_mixup], axis=1
+        )
+        return {"boxes": boxes, "classes": classes}
+
+    def transform_segmentation_masks(
+        self, segmentation_masks, transformation, training=True
+    ):
+        mix_weight = transformation["mix_weight"]
+        permutation_order = transformation["permutation_order"]
+
+        mix_weight = self.backend.numpy.reshape(mix_weight, [-1, 1, 1, 1])
+
+        segmentation_masks_for_mixup = self.backend.numpy.take(
+            segmentation_masks, permutation_order
+        )
+
+        segmentation_masks = (
+            mix_weight * segmentation_masks
+            + (1.0 - mix_weight) * segmentation_masks_for_mixup
+        )
+
+        return segmentation_masks
+
+    def compute_output_shape(self, input_shape):
+        return input_shape
+
+    def get_config(self):
+        config = {
+            "alpha": self.alpha,
+            "seed": self.seed,
+        }
+        base_config = super().get_config()
+        return {**base_config, **config}
diff --git a/keras/src/layers/preprocessing/image_preprocessing/mix_up_test.py b/keras/src/layers/preprocessing/image_preprocessing/mix_up_test.py
@@ -0,0 +1,63 @@
+import numpy as np
+import pytest
+from tensorflow import data as tf_data
+
+from keras.src import layers
+from keras.src import testing
+
+
+class MixUpTest(testing.TestCase):
+    @pytest.mark.requires_trainable_backend
+    def test_layer(self):
+        self.run_layer_test(
+            layers.MixUp,
+            init_kwargs={
+                "alpha": 0.2,
+            },
+            input_shape=(8, 3, 4, 3),
+            supports_masking=False,
+            expected_output_shape=(8, 3, 4, 3),
+        )
+
+    def test_mix_up_basic_functionality(self):
+        image = np.random.random((64, 64, 3))
+        mix_up_layer = layers.MixUp(alpha=1)
+        transformation = {"mix_weight": 1, "permutation_order": [0]}
+        output = mix_up_layer.transform_images(
+            image, transformation=transformation
+        )[0]
+        self.assertAllClose(output, image)
+
+        image = np.random.random((4, 64, 64, 3))
+        mix_up_layer = layers.MixUp(alpha=0.2)
+        transformation = {"mix_weight": 0.2, "permutation_order": [1, 0, 2, 3]}
+        output = mix_up_layer.transform_images(
+            image, transformation=transformation
+        )
+        self.assertNotAllClose(output, image)
+        self.assertAllClose(output.shape, image.shape)
+
+    def test_mix_up_basic_functionality_channel_first(self):
+        image = np.random.random((3, 64, 64))
+        mix_up_layer = layers.MixUp(alpha=1)
+        transformation = {"mix_weight": 1, "permutation_order": [0]}
+        output = mix_up_layer.transform_images(
+            image, transformation=transformation
+        )[0]
+        self.assertAllClose(output, image)
+
+        image = np.random.random((4, 3, 64, 64))
+        mix_up_layer = layers.MixUp(alpha=0.2)
+        transformation = {"mix_weight": 0.2, "permutation_order": [1, 0, 2, 3]}
+        output = mix_up_layer.transform_images(
+            image, transformation=transformation
+        )
+        self.assertNotAllClose(output, image)
+        self.assertAllClose(output.shape, image.shape)
+
+    def test_tf_data_compatibility(self):
+        layer = layers.MixUp()
+        input_data = np.random.random((2, 8, 8, 3))
+        ds = tf_data.Dataset.from_tensor_slices(input_data).batch(2).map(layer)
+        for output in ds.take(1):
+            output.numpy()