add apply_to_images (#2560)

trylinka · web-flow · commit 3db139d5c5b8 · 2025-06-17T16:05:53.000-07:00
* add apply_to_images

* test for generate_noise

* Refactor generate_noise tests to use pytest.mark.parametrize instead of conditionals

* Fix processing for batches

* optimize add_noise for batched inputs

* removed unused tests

* removed unused tests
diff --git a/albumentations/augmentations/pixel/functional.py b/albumentations/augmentations/pixel/functional.py
@@ -2301,7 +2301,10 @@ def add_noise(img: np.ndarray, noise: np.ndarray) -> np.ndarray:
         np.ndarray: The noise added to the image.
 
     """
-    return add(img, noise, inplace=False)
+    n_tiles = np.prod(img.shape) // np.prod(noise.shape)
+    noise = np.tile(noise, (n_tiles,) + (1,) * noise.ndim).reshape(img.shape)
+
+    return add_array(img, noise, inplace=False)
 
 
 def slic(
diff --git a/albumentations/augmentations/pixel/transforms.py b/albumentations/augmentations/pixel/transforms.py
@@ -21,6 +21,7 @@
     MAX_VALUES_BY_DTYPE,
     NUM_MULTI_CHANNEL_DIMENSIONS,
     batch_transform,
+    get_image_data,
     get_num_channels,
     is_grayscale_image,
     is_rgb_image,
@@ -2631,6 +2632,39 @@ def apply(
         """
         return fpixel.add_noise(img, noise_map)
 
+    def apply_to_images(self, images: np.ndarray, noise_map: np.ndarray, **params: Any) -> np.ndarray:
+        """Apply the Gaussian noise to a batch of images.
+
+        Args:
+            images (np.ndarray): The batch of images to apply the Gaussian noise to.
+            noise_map (np.ndarray): The noise map to apply to the images.
+            **params (Any): Additional parameters (not used in this transform).
+
+        """
+        return fpixel.add_noise(images, noise_map)
+
+    def apply_to_volume(self, volume: np.ndarray, noise_map: np.ndarray, **params: Any) -> np.ndarray:
+        """Apply the Gaussian noise to a single volume.
+
+        Args:
+            volume (np.ndarray): The volume to apply the Gaussian noise to.
+            noise_map (np.ndarray): The noise map to apply to the volume.
+            **params (Any): Additional parameters (not used in this transform).
+
+        """
+        return fpixel.add_noise(volume, noise_map)
+
+    def apply_to_volumes(self, volumes: np.ndarray, noise_map: np.ndarray, **params: Any) -> np.ndarray:
+        """Apply the Gaussian noise to a batch of volumes.
+
+        Args:
+            volumes (np.ndarray): The batch of volumes to apply the Gaussian noise to.
+            noise_map (np.ndarray): The noise map to apply to the volumes.
+            **params (Any): Additional parameters (not used in this transform).
+
+        """
+        return fpixel.add_noise(volumes, noise_map)
+
     def get_params_dependent_on_data(
         self,
         params: dict[str, Any],
@@ -2647,17 +2681,17 @@ def get_params_dependent_on_data(
                 - "noise_map" (np.ndarray): The noise map to apply to the image.
 
         """
-        image = data["image"] if "image" in data else data["images"][0]
-        max_value = MAX_VALUES_BY_DTYPE[image.dtype]
+        metadata = get_image_data(data)
+        max_value = MAX_VALUES_BY_DTYPE[metadata["dtype"]]
+        shape = (metadata["height"], metadata["width"], metadata["num_channels"])
 
         sigma = self.py_random.uniform(*self.std_range)
-
         mean = self.py_random.uniform(*self.mean_range)
 
         noise_map = fpixel.generate_noise(
             noise_type="gaussian",
             spatial_mode="per_pixel" if self.per_channel else "shared",
-            shape=image.shape,
+            shape=shape,
             params={"mean_range": (mean, mean), "std_range": (sigma, sigma)},
             max_value=max_value,
             approximation=self.noise_scale_factor,
@@ -6036,14 +6070,14 @@ def get_params_dependent_on_data(
             data (dict[str, Any]): The data to apply the transform to.
 
         """
-        image = data["image"] if "image" in data else data["images"][0]
-
-        max_value = MAX_VALUES_BY_DTYPE[image.dtype]
+        metadata = get_image_data(data)
+        max_value = MAX_VALUES_BY_DTYPE[metadata["dtype"]]
+        shape = (metadata["height"], metadata["width"], metadata["num_channels"])
 
         noise_map = fpixel.generate_noise(
             noise_type=self.noise_type,
             spatial_mode=self.spatial_mode,
-            shape=image.shape,
+            shape=shape,
             params=self.noise_params,
             max_value=max_value,
             approximation=self.approximation,
@@ -6180,7 +6214,7 @@ class SaltAndPepper(ImageOnlyTransform):
     """Apply salt and pepper noise to the input image.
 
     Salt and pepper noise is a form of impulse noise that randomly sets pixels to either maximum value (salt)
-    or minimum value (pepper). The amount and proportion of salt vs pepper noise can be controlled.
+    or minimum value (pepper). The amount and proportion of salt vs pepper can be controlled.
     The same noise mask is applied to all channels of the image to preserve color consistency.
 
     Args:
@@ -6283,8 +6317,7 @@ def get_params_dependent_on_data(
             data (dict[str, Any]): The data to apply the transform to.
 
         """
-        image = data["image"] if "image" in data else data["images"][0]
-        height, width = image.shape[:2]
+        height, width = params["shape"][:2]
 
         total_amount = self.py_random.uniform(*self.amount)
         salt_ratio = self.py_random.uniform(*self.salt_vs_pepper)
diff --git a/setup.py b/setup.py
@@ -8,7 +8,7 @@
     "PyYAML",
     "typing-extensions>=4.9.0; python_version<'3.10'",
     "pydantic>=2.9.2",
-    "albucore==0.0.26",
+    "albucore==0.0.28",
     "eval-type-backport; python_version<'3.10'",
 ]
 
diff --git a/tests/functional/test_functional.py b/tests/functional/test_functional.py
@@ -23,6 +23,7 @@
 from tests.utils import convert_2d_to_target_format
 from copy import deepcopy
 from sklearn.decomposition import NMF
+from typing import Any
 
 
 @pytest.mark.parametrize(

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@`
`8`	`8`	`"PyYAML",`
`9`	`9`	`"typing-extensions>=4.9.0; python_version<'3.10'",`
`10`	`10`	`"pydantic>=2.9.2",`
`11`		`- "albucore==0.0.26",`
	`11`	`+ "albucore==0.0.28",`
`12`	`12`	`"eval-type-backport; python_version<'3.10'",`
`13`	`13`	`]`
`14`	`14`