Update the Resize transform to use scikit-image's `resize` instead of `scipy.misc.imresize`

thrau · thrau · commit ddfb4daf57dd · 2021-03-09T18:58:38.000+01:00
diff --git a/dataloaders/transforms.py b/dataloaders/transforms.py
@@ -4,6 +4,7 @@
 import random
 
 from PIL import Image, ImageOps, ImageEnhance
+
 try:
     import accimage
 except ImportError:
@@ -16,21 +17,24 @@
 import warnings
 
 import scipy.ndimage.interpolation as itpl
-import scipy.misc as misc
+from skimage.transform import resize as imresize
 
 
 def _is_numpy_image(img):
     return isinstance(img, np.ndarray) and (img.ndim in {2, 3})
 
+
 def _is_pil_image(img):
     if accimage is not None:
         return isinstance(img, (Image.Image, accimage.Image))
     else:
         return isinstance(img, Image.Image)
 
+
 def _is_tensor_image(img):
     return torch.is_tensor(img) and img.ndimension() == 3
 
+
 def adjust_brightness(img, brightness_factor):
     """Adjust brightness of an Image.
 
@@ -114,7 +118,7 @@ def adjust_hue(img, hue_factor):
     Returns:
         PIL Image: Hue adjusted image.
     """
-    if not(-0.5 <= hue_factor <= 0.5):
+    if not (-0.5 <= hue_factor <= 0.5):
         raise ValueError('hue_factor is not in [-0.5, 0.5].'.format(hue_factor))
 
     if not _is_pil_image(img):
@@ -207,7 +211,7 @@ def __call__(self, img):
         Returns:
             Tensor: Converted image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
 
         if isinstance(img, np.ndarray):
@@ -247,14 +251,15 @@ def __call__(self, img):
         Returns:
             Tensor: Normalized image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
         # TODO: make efficient
         print(img.shape)
         for i in range(3):
-            img[:,:,i] = (img[:,:,i] - self.mean[i]) / self.std[i]
+            img[:, :, i] = (img[:, :, i] - self.mean[i]) / self.std[i]
         return img
 
+
 class NormalizeTensor(object):
     """Normalize an tensor image with mean and standard deviation.
     Given mean: ``(M1,...,Mn)`` and std: ``(M1,..,Mn)`` for ``n`` channels, this transform
@@ -285,6 +290,7 @@ def __call__(self, tensor):
             t.sub_(m).div_(s)
         return tensor
 
+
 class Rotate(object):
     """Rotates the given ``numpy.ndarray``.
 
@@ -333,10 +339,16 @@ def __call__(self, img):
         Returns:
             PIL Image: Rescaled image.
         """
+        if isinstance(self.size, numbers.Number):
+            h, w = img.shape[0], img.shape[1]
+            shape = (int(h * self.size), int(w * self.size))
+        else:
+            shape = self.size
+
         if img.ndim == 3:
-            return misc.imresize(img, self.size, self.interpolation)
+            return imresize(img, shape)
         elif img.ndim == 2:
-            return misc.imresize(img, self.size, self.interpolation, 'F')
+            return imresize(img, shape)
         else:
             RuntimeError('img should be ndarray with 2 or 3 dimensions. Got {}'.format(img.ndim))
 
@@ -395,15 +407,16 @@ def __call__(self, img):
         h: Height of the cropped image.
         w: Width of the cropped image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
         if img.ndim == 3:
-            return img[i:i+h, j:j+w, :]
+            return img[i:i + h, j:j + w, :]
         elif img.ndim == 2:
             return img[i:i + h, j:j + w]
         else:
             raise RuntimeError('img should be ndarray with 2 or 3 dimensions. Got {}'.format(img.ndim))
 
+
 class BottomCrop(object):
     """Crops the given ``numpy.ndarray`` at the bottom.
 
@@ -458,15 +471,16 @@ def __call__(self, img):
         h: Height of the cropped image.
         w: Width of the cropped image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
         if img.ndim == 3:
-            return img[i:i+h, j:j+w, :]
+            return img[i:i + h, j:j + w, :]
         elif img.ndim == 2:
             return img[i:i + h, j:j + w]
         else:
             raise RuntimeError('img should be ndarray with 2 or 3 dimensions. Got {}'.format(img.ndim))
 
+
 class Lambda(object):
     """Apply a user-defined lambda as a transform.
 
@@ -501,7 +515,7 @@ def __call__(self, img):
         Returns:
             img (numpy.ndarray (C x H x W)): flipped image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
 
         if self.do_flip:
@@ -523,6 +537,7 @@ class ColorJitter(object):
         hue(float): How much to jitter hue. hue_factor is chosen uniformly from
             [-hue, hue]. Should be >=0 and <= 0.5.
     """
+
     def __init__(self, brightness=0, contrast=0, saturation=0, hue=0):
         self.brightness = brightness
         self.contrast = contrast
@@ -569,14 +584,15 @@ def __call__(self, img):
         Returns:
             img (numpy.ndarray (C x H x W)): Color jittered image.
         """
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
 
         pil = Image.fromarray(img)
         transform = self.get_params(self.brightness, self.contrast,
                                     self.saturation, self.hue)
         return np.array(transform(pil))
 
+
 class Crop(object):
     """Crops the given PIL Image to a rectangular region based on a given
     4-tuple defining the left, upper pixel coordinated, hight and width size.
@@ -607,7 +623,7 @@ def __call__(self, img):
 
         i, j, h, w = self.i, self.j, self.h, self.w
 
-        if not(_is_numpy_image(img)):
+        if not (_is_numpy_image(img)):
             raise TypeError('img should be ndarray. Got {}'.format(type(img)))
         if img.ndim == 3:
             return img[i:i + h, j:j + w, :]