Implement Square Pad and Resize Preprocessors #2138

Merged · 18 commits · Jun 13, 2023
Changes from all commits
4 changes: 2 additions & 2 deletions art/defences/preprocessor/preprocessor.py
@@ -80,7 +80,7 @@ def apply_predict(self) -> bool:
         return self._apply_predict

     @abc.abstractmethod
-    def __call__(self, x: np.ndarray, y: Optional[np.ndarray] = None) -> Tuple[np.ndarray, Optional[np.ndarray]]:
+    def __call__(self, x: np.ndarray, y: Optional[Any] = None) -> Tuple[np.ndarray, Optional[Any]]:
"""
Perform data preprocessing and return preprocessed data as tuple.

@@ -250,7 +250,7 @@ class PreprocessorTensorFlowV2(Preprocessor):
     """

     @abc.abstractmethod
-    def forward(self, x: "tf.Tensor", y: Optional["tf.Tensor"] = None) -> Tuple["tf.Tensor", Optional["tf.Tensor"]]:
+    def forward(self, x: "tf.Tensor", y: Optional[Any] = None) -> Tuple["tf.Tensor", Optional[Any]]:
"""
Perform data preprocessing in TensorFlow v2 and return preprocessed data as tuple.

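The change above widens the label parameter from `Optional[np.ndarray]` to `Optional[Any]`, so the same preprocessor interface now admits object-detection labels (a list of per-image dicts) as well as plain class arrays. A minimal illustration of the two label shapes, with made-up values:

from typing import Any, Optional

import numpy as np

# Classification labels: a plain array, as before.
y_classification: Optional[np.ndarray] = np.array([0, 1])

# Object-detection labels: one dict per image, which only `Optional[Any]` admits.
y_detection: Optional[Any] = [
    {"boxes": np.array([[4.0, 4.0, 20.0, 20.0]]), "labels": np.array([1])},
    {"boxes": np.array([[2.0, 6.0, 16.0, 28.0]]), "labels": np.array([3])},
]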
9 changes: 9 additions & 0 deletions art/preprocessing/image/__init__.py
@@ -0,0 +1,9 @@
"""
This module contains image preprocessing tools.
"""
from art.preprocessing.image.image_resize.numpy import ImageResize
from art.preprocessing.image.image_resize.pytorch import ImageResizePyTorch
from art.preprocessing.image.image_resize.tensorflow import ImageResizeTensorFlowV2
from art.preprocessing.image.image_square_pad.numpy import ImageSquarePad
from art.preprocessing.image.image_square_pad.pytorch import ImageSquarePadPyTorch
from art.preprocessing.image.image_square_pad.tensorflow import ImageSquarePadTensorFlowV2
Empty file.
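The new `art.preprocessing.image` package re-exports all six preprocessors from one import point. A hedged usage sketch of the NumPy resizer on a classification batch (shapes are illustrative; `ImageSquarePad`'s constructor is not part of this excerpt, so only `ImageResize` is exercised):

import numpy as np

from art.preprocessing.image import ImageResize

x = np.random.rand(4, 64, 48, 3).astype(np.float32)  # NHWC batch

resizer = ImageResize(height=32, width=32, channels_first=False)
x_resized, _ = resizer(x)  # labels default to None for classification
print(x_resized.shape)  # (4, 32, 32, 3)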
154 changes: 154 additions & 0 deletions art/preprocessing/image/image_resize/numpy.py
@@ -0,0 +1,154 @@
# MIT License
#
# Copyright (C) The Adversarial Robustness Toolbox (ART) Authors 2023
#
# Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated
# documentation files (the "Software"), to deal in the Software without restriction, including without limitation the
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit
# persons to whom the Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all copies or substantial portions of the
# Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
# WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
"""
This module implements resizing for images and object detection bounding boxes.
"""
import logging
from typing import Dict, List, Optional, TYPE_CHECKING, Tuple, Union

import numpy as np
import cv2
from tqdm.auto import tqdm

from art.preprocessing.preprocessing import Preprocessor

if TYPE_CHECKING:
from art.utils import CLIP_VALUES_TYPE

logger = logging.getLogger(__name__)


class ImageResize(Preprocessor):
"""
    This class implements resizing for images and object detection bounding boxes.
"""

params = ["height", "width", "channels_first", "label_type", "interpolation", "clip_values", "verbose"]

label_types = ["classification", "object_detection"]

def __init__(
self,
height: int,
width: int,
channels_first: bool = False,
label_type: str = "classification",
interpolation: int = cv2.INTER_LINEAR,
clip_values: Optional["CLIP_VALUES_TYPE"] = None,
apply_fit: bool = True,
apply_predict: bool = False,
verbose: bool = False,
):
"""
Create an instance of ImageResize.

:param height: The height of the resized image.
:param width: The width of the resized image.
:param channels_first: Set channels first or last.
:param label_type: String defining the label type. Currently supported: `classification`, `object_detection`
        :param interpolation: The interpolation method used to resize the image, as defined by the
            `cv2::InterpolationFlags` enum.
:param clip_values: Tuple of the form `(min, max)` representing the minimum and maximum values allowed
for features.
:param apply_fit: True if applied during fitting/training.
:param apply_predict: True if applied during predicting.
:param verbose: Show progress bars.
"""
super().__init__(is_fitted=True, apply_fit=apply_fit, apply_predict=apply_predict)
self.height = height
self.width = width
self.channels_first = channels_first
self.label_type = label_type
self.interpolation = interpolation
self.clip_values = clip_values
self.verbose = verbose
self._check_params()

def __call__(
self, x: np.ndarray, y: Optional[Union[np.ndarray, List[Dict[str, np.ndarray]]]] = None
) -> Tuple[np.ndarray, Optional[Union[np.ndarray, List[Dict[str, np.ndarray]]]]]:
"""
Resize `x` and adjust bounding boxes for labels `y` accordingly.

:param x: Input samples. A list of samples is also supported.
:param y: Label of the samples `x`.
:return: Transformed samples and labels.
"""
x_preprocess_list = []
y_preprocess: Optional[Union[np.ndarray, List[Dict[str, np.ndarray]]]]
if y is not None and self.label_type == "object_detection":
y_preprocess = []
else:
y_preprocess = y

for i, x_i in enumerate(tqdm(x, desc="ImageResize", disable=not self.verbose)):
if self.channels_first:
x_i = np.transpose(x_i, (1, 2, 0))

            # Resize image: cv2.resize takes dsize as (width, height), hence the swapped order
x_resized = cv2.resize(x_i, (self.width, self.height), interpolation=self.interpolation)

if self.channels_first:
x_resized = np.transpose(x_resized, (2, 0, 1))

x_preprocess_list.append(x_resized)

if self.label_type == "object_detection" and y is not None:
y_resized: Dict[str, np.ndarray] = {}

# Copy labels and ensure types
if isinstance(y, list) and isinstance(y_preprocess, list):
y_i = y[i]
if isinstance(y_i, dict):
y_resized = {k: np.copy(v) for k, v in y_i.items()}
else:
raise TypeError("Wrong type for `y` and label_type=object_detection.")
else:
raise TypeError("Wrong type for `y` and label_type=object_detection.")

# Calculate scaling factor
height, width, _ = x_i.shape
height_scale = self.height / height
width_scale = self.width / width

# Resize bounding boxes
y_resized["boxes"][:, 0] *= width_scale
y_resized["boxes"][:, 1] *= height_scale
y_resized["boxes"][:, 2] *= width_scale
y_resized["boxes"][:, 3] *= height_scale

y_preprocess.append(y_resized)

x_preprocess = np.stack(x_preprocess_list)
if self.clip_values is not None:
x_preprocess = np.clip(x_preprocess, self.clip_values[0], self.clip_values[1])

return x_preprocess, y_preprocess

def _check_params(self) -> None:
if self.height <= 0:
raise ValueError("The desired image height must be positive.")

if self.width <= 0:
raise ValueError("The desired image width must be positive")

if self.clip_values is not None:
if len(self.clip_values) != 2:
raise ValueError("`clip_values` should be a tuple of 2 floats containing the allowed data range.")

if self.clip_values[0] >= self.clip_values[1]:
raise ValueError("Invalid `clip_values`: min >= max.")
161 changes: 161 additions & 0 deletions art/preprocessing/image/image_resize/pytorch.py
@@ -0,0 +1,161 @@
# MIT License
#
# Copyright (C) The Adversarial Robustness Toolbox (ART) Authors 2023
#
# Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated
# documentation files (the "Software"), to deal in the Software without restriction, including without limitation the
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit
# persons to whom the Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all copies or substantial portions of the
# Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
# WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
"""
This module implements resizing for images and object detection bounding boxes in PyTorch.
"""
import logging
from typing import Dict, List, Optional, TYPE_CHECKING, Tuple, Union

from tqdm.auto import tqdm

from art.preprocessing.preprocessing import PreprocessorPyTorch

if TYPE_CHECKING:
# pylint: disable=C0412
import torch
from art.utils import CLIP_VALUES_TYPE

logger = logging.getLogger(__name__)


class ImageResizePyTorch(PreprocessorPyTorch):
"""
    This class implements resizing for images and object detection bounding boxes in PyTorch.
"""

params = ["height", "width", "channels_first", "label_type", "interpolation", "clip_values", "verbose"]

label_types = ["classification", "object_detection"]

def __init__(
self,
height: int,
width: int,
channels_first: bool = True,
label_type: str = "classification",
interpolation: str = "bilinear",
clip_values: Optional["CLIP_VALUES_TYPE"] = None,
apply_fit: bool = True,
apply_predict: bool = False,
verbose: bool = False,
):
"""
Create an instance of ImageResizePyTorch.

:param height: The height of the resized image.
:param width: The width of the resized image.
:param channels_first: Set channels first or last.
:param label_type: String defining the label type. Currently supported: `classification`, `object_detection`
:param interpolation: String defining the resizing method. Currently supported: `nearest`, `linear`,
`bilinear`, `bicubic`, `trilinear`, `area`, `nearest-exact`
:param clip_values: Tuple of the form `(min, max)` representing the minimum and maximum values allowed
for features.
:param apply_fit: True if applied during fitting/training.
:param apply_predict: True if applied during predicting.
:param verbose: Show progress bars.
"""
super().__init__(is_fitted=True, apply_fit=apply_fit, apply_predict=apply_predict)
self.height = height
self.width = width
self.channels_first = channels_first
self.label_type = label_type
self.interpolation = interpolation
self.clip_values = clip_values
self.verbose = verbose
self._check_params()

def forward(
self,
x: "torch.Tensor",
y: Optional[Union["torch.Tensor", List[Dict[str, "torch.Tensor"]]]] = None,
) -> Tuple["torch.Tensor", Optional[Union["torch.Tensor", List[Dict[str, "torch.Tensor"]]]]]:
"""
Resize `x` and adjust bounding boxes for labels `y` accordingly.

:param x: Input samples. A list of samples is also supported.
:param y: Label of the samples `x`.
:return: Transformed samples and labels.
"""
import torch

x_preprocess_list = []
y_preprocess: Optional[Union[torch.Tensor, List[Dict[str, torch.Tensor]]]]
if y is not None and self.label_type == "object_detection":
y_preprocess = []
else:
y_preprocess = y

for i, x_i in enumerate(tqdm(x, desc="ImageResizePyTorch", disable=not self.verbose)):
if not self.channels_first:
x_i = torch.permute(x_i, (2, 0, 1))

            # Resize image: `interpolate` expects a batch dimension, so add one of size 1
            x_resized = torch.nn.functional.interpolate(
                x_i.unsqueeze(0), size=(self.height, self.width), mode=self.interpolation
            ).squeeze(0)  # squeeze only the batch dim; a bare `.squeeze()` would also drop a size-1 channel dim

if not self.channels_first:
x_resized = torch.permute(x_resized, (1, 2, 0))

x_preprocess_list.append(x_resized)

if self.label_type == "object_detection" and y is not None:
y_resized: Dict[str, torch.Tensor] = {}

# Copy labels and ensure types
if isinstance(y, list) and isinstance(y_preprocess, list):
y_i = y[i]
if isinstance(y_i, dict):
y_resized = {k: torch.clone(v) for k, v in y_i.items()}
else:
raise TypeError("Wrong type for `y` and label_type=object_detection.")
else:
raise TypeError("Wrong type for `y` and label_type=object_detection.")

# Calculate scaling factor
_, height, width = x_i.shape
height_scale = self.height / height
width_scale = self.width / width

# Resize bounding boxes
y_resized["boxes"][:, 0] *= width_scale
y_resized["boxes"][:, 1] *= height_scale
y_resized["boxes"][:, 2] *= width_scale
y_resized["boxes"][:, 3] *= height_scale

y_preprocess.append(y_resized)

x_preprocess = torch.stack(x_preprocess_list)
if self.clip_values is not None:
x_preprocess = torch.clamp(x_preprocess, self.clip_values[0], self.clip_values[1]) # type: ignore

return x_preprocess, y_preprocess

def _check_params(self) -> None:
if self.height <= 0:
raise ValueError("The desired image height must be positive.")

if self.width <= 0:
raise ValueError("The desired image width must be positive")

if self.clip_values is not None:
if len(self.clip_values) != 2:
raise ValueError("`clip_values` should be a tuple of 2 floats containing the allowed data range.")

if self.clip_values[0] >= self.clip_values[1]:
raise ValueError("Invalid `clip_values`: min >= max.")