pytorch · datumbox · Oct 24, 2022 · Oct 24, 2022 · Oct 24, 2022 · Oct 24, 2022
diff --git a/torchvision/prototype/transforms/functional/_misc.py b/torchvision/prototype/transforms/functional/_misc.py
@@ -8,7 +8,39 @@
 from torchvision.transforms import functional_tensor as _FT
 from torchvision.transforms.functional import pil_to_tensor, to_pil_image
 
-normalize_image_tensor = _FT.normalize
+
def normalize_image_tensor(
    image: torch.Tensor, mean: List[float], std: List[float], inplace: bool = False
) -> torch.Tensor:
    """Normalize a floating point tensor image as ``(image - mean) / std``.

    ``mean`` and ``std`` are converted to tensors with the dtype and device of
    ``image``. One-dimensional values are reshaped to ``(-1, 1, 1)`` so that
    they broadcast over the last two dimensions of ``image``.

    Args:
        image: Floating point tensor with at least three dimensions
            (the error message below describes it as ``(..., C, H, W)``).
        mean: Value(s) subtracted from ``image``.
        std: Value(s) ``image`` is divided by. Must not contain a zero.
        inplace: If ``True``, ``image`` itself is modified and returned.
            Otherwise ``image`` is left untouched and a new tensor is returned.

    Returns:
        The normalized tensor.

    Raises:
        TypeError: If ``image`` is not a tensor or is not floating point.
        ValueError: If ``image`` has fewer than three dimensions or ``std``
            contains a zero.
    """
    if not isinstance(image, torch.Tensor):
        raise TypeError("Input img should be Tensor image")

    if not image.is_floating_point():
        raise TypeError(f"Input tensor should be a float tensor. Got {image.dtype}.")

    if image.ndim < 3:
        raise ValueError(
            f"Expected tensor to be a tensor image of size (..., C, H, W). Got tensor.size() = {image.size()}"
        )

    # The zero check runs on the raw ``std`` value, *before* it is converted to
    # a tensor, so plain Python sequences and scalars never need a tensor
    # reduction. A non-zero value that underflows to zero during the dtype
    # conversion is therefore not detected here.
    if isinstance(std, (tuple, list)):
        has_zero = not all(std)
    elif isinstance(std, torch.Tensor):
        # ``std == 0`` on a multi-element tensor has no single truth value;
        # reduce it explicitly instead of letting ``if`` raise a RuntimeError.
        has_zero = bool((std == 0).any())
    else:
        has_zero = std == 0
    if has_zero:
        raise ValueError("std evaluated to zero, leading to division by zero.")

    dtype = image.dtype
    device = image.device
    mean = torch.as_tensor(mean, dtype=dtype, device=device)
    std = torch.as_tensor(std, dtype=dtype, device=device)
    if mean.ndim == 1:
        mean = mean.view(-1, 1, 1)
    if std.ndim == 1:
        std = std.view(-1, 1, 1)

    if inplace:
        image = image.sub_(mean)
    else:
        image = image.sub(mean)

    # At this point ``image`` is either the caller's tensor (inplace=True) or a
    # fresh tensor produced by ``sub``, so dividing in place is safe in both
    # cases and avoids one extra allocation.
    return image.div_(std)
 
 
 def normalize_video(video: torch.Tensor, mean: List[float], std: List[float], inplace: bool = False) -> torch.Tensor: