| """Contains an implementation of image normalizers for perceptual loss. |
| |
| For licensing see accompanying LICENSE file. |
| Copyright (C) 2025 Apple Inc. All Rights Reserved. |
| """ |
|
|
| from __future__ import annotations |
|
|
| from typing import Sequence, Union |
|
|
| import torch |
| from torch import nn |
|
|
|
|
| class MeanStdNormalizer(nn.Module): |
| """Normalizing image input by mean and std.""" |
|
|
| mean: torch.Tensor |
| std_inv: torch.Tensor |
|
|
| def __init__( |
| self, |
| mean: Union[Sequence[float], torch.Tensor], |
| std: Union[Sequence[float], torch.Tensor], |
| ): |
| """Initialize MeanStdNormalizer.""" |
| super(MeanStdNormalizer, self).__init__() |
| if not isinstance(mean, torch.Tensor): |
| mean = torch.as_tensor(mean).view(-1, 1, 1) |
| if not isinstance(std, torch.Tensor): |
| std = torch.as_tensor(std).view(-1, 1, 1) |
| self.register_buffer("mean", mean) |
| |
| self.register_buffer("std_inv", 1.0 / std) |
|
|
| def forward(self, image: torch.Tensor) -> torch.Tensor: |
| """Apply mean and std normalization over input image.""" |
| return (image - self.mean) * self.std_inv |
|
|
|
|
| class AffineRangeNormalizer(nn.Module): |
| """Perform linear mapping to map input_range to output_range. |
| |
| Output_range defaults to (0, 1). |
| """ |
|
|
| def __init__( |
| self, |
| input_range: tuple[float, float], |
| output_range: tuple[float, float] = (0, 1), |
| ): |
| """Initialize AffineRangeNormalizer.""" |
| super().__init__() |
| input_min, input_max = input_range |
| output_min, output_max = output_range |
| if input_max <= input_min: |
| raise ValueError(f"Invalid input_range: {input_range}") |
| if output_max <= output_min: |
| raise ValueError(f"Invalid output_range: {output_range}") |
|
|
| self.scale = (output_max - output_min) / (input_max - input_min) |
| self.bias = output_min - input_min * self.scale |
|
|
| def forward(self, x: torch.Tensor) -> torch.Tensor: |
| """Apply affine range normalization over input image.""" |
| if self.scale != 1.0: |
| x = x * self.scale |
|
|
| if self.bias != 0.0: |
| x = x + self.bias |
|
|
| return x |
|
|
|
|
| class MobileNetNormalizer(AffineRangeNormalizer): |
| """Image normalization in mobilenet.""" |
|
|
| def __init__(self, input_range: tuple[float, float] = (0, 1)): |
| """Initialize MobileNetNormalizer.""" |
| super().__init__(input_range=input_range, output_range=(-1, 1)) |
|
|