| | """Contains an implementation of image normalizers for perceptual loss. |
| | |
| | For licensing see accompanying LICENSE file. |
| | Copyright (C) 2025 Apple Inc. All Rights Reserved. |
| | """ |
| |
|
| | from __future__ import annotations |
| |
|
| | from typing import Sequence, Union |
| |
|
| | import torch |
| | from torch import nn |
| |
|
| |
|
| | class MeanStdNormalizer(nn.Module): |
| | """Normalizing image input by mean and std.""" |
| |
|
| | mean: torch.Tensor |
| | std_inv: torch.Tensor |
| |
|
| | def __init__( |
| | self, |
| | mean: Union[Sequence[float], torch.Tensor], |
| | std: Union[Sequence[float], torch.Tensor], |
| | ): |
| | """Initialize MeanStdNormalizer.""" |
| | super(MeanStdNormalizer, self).__init__() |
| | if not isinstance(mean, torch.Tensor): |
| | mean = torch.as_tensor(mean).view(-1, 1, 1) |
| | if not isinstance(std, torch.Tensor): |
| | std = torch.as_tensor(std).view(-1, 1, 1) |
| | self.register_buffer("mean", mean) |
| | |
| | self.register_buffer("std_inv", 1.0 / std) |
| |
|
| | def forward(self, image: torch.Tensor) -> torch.Tensor: |
| | """Apply mean and std normalization over input image.""" |
| | return (image - self.mean) * self.std_inv |
| |
|
| |
|
| | class AffineRangeNormalizer(nn.Module): |
| | """Perform linear mapping to map input_range to output_range. |
| | |
| | Output_range defaults to (0, 1). |
| | """ |
| |
|
| | def __init__( |
| | self, |
| | input_range: tuple[float, float], |
| | output_range: tuple[float, float] = (0, 1), |
| | ): |
| | """Initialize AffineRangeNormalizer.""" |
| | super().__init__() |
| | input_min, input_max = input_range |
| | output_min, output_max = output_range |
| | if input_max <= input_min: |
| | raise ValueError(f"Invalid input_range: {input_range}") |
| | if output_max <= output_min: |
| | raise ValueError(f"Invalid output_range: {output_range}") |
| |
|
| | self.scale = (output_max - output_min) / (input_max - input_min) |
| | self.bias = output_min - input_min * self.scale |
| |
|
| | def forward(self, x: torch.Tensor) -> torch.Tensor: |
| | """Apply affine range normalization over input image.""" |
| | if self.scale != 1.0: |
| | x = x * self.scale |
| |
|
| | if self.bias != 0.0: |
| | x = x + self.bias |
| |
|
| | return x |
| |
|
| |
|
| | class MobileNetNormalizer(AffineRangeNormalizer): |
| | """Image normalization in mobilenet.""" |
| |
|
| | def __init__(self, input_range: tuple[float, float] = (0, 1)): |
| | """Initialize MobileNetNormalizer.""" |
| | super().__init__(input_range=input_range, output_range=(-1, 1)) |
| |
|