Source code for sc2bench.transforms.misc

import collections

import numpy as np
import torch
from PIL.Image import Image
from torch import nn
from torch.utils.data._utils.collate import np_str_obj_array_pattern, default_collate_err_msg_format
from torchdistill.common import tensor_util
from torchdistill.datasets.collator import register_collate_func
from torchdistill.datasets.transform import register_transform_class
from torchvision.transforms import functional as F
from torchvision.transforms.functional import pad

MISC_TRANSFORM_MODULE_DICT = dict()


[docs]def register_misc_transform_module(cls): """ Registers a miscellaneous transform class. :param cls: miscellaneous transform class to be registered :type cls: class :return: registered miscellaneous transform class :rtype: class """ MISC_TRANSFORM_MODULE_DICT[cls.__name__] = cls register_transform_class(cls) return cls
[docs]@register_collate_func def default_collate_w_pil(batch): """ Puts each data field into a tensor or PIL Image with outer dimension batch size. :param batch: single batch to be collated :return: collated batch """ # Extended `default_collate` function in PyTorch elem = batch[0] elem_type = type(elem) if isinstance(elem, torch.Tensor): out = None if torch.utils.data.get_worker_info() is not None: # If we're in a background process, concatenate directly into a # shared memory tensor to avoid an extra copy numel = sum(x.numel() for x in batch) storage = elem.storage()._new_shared(numel) out = elem.new(storage) return torch.stack(batch, 0, out=out) elif elem_type.__module__ == 'numpy' and elem_type.__name__ != 'str_' \ and elem_type.__name__ != 'string_': if elem_type.__name__ == 'ndarray' or elem_type.__name__ == 'memmap': # array of string classes and object if np_str_obj_array_pattern.search(elem.dtype.str) is not None: raise TypeError(default_collate_err_msg_format.format(elem.dtype)) return default_collate_w_pil([torch.as_tensor(b) for b in batch]) elif elem.shape == (): # scalars return torch.as_tensor(batch) elif isinstance(elem, float): return torch.tensor(batch, dtype=torch.float64) elif isinstance(elem, int): return torch.tensor(batch) elif isinstance(elem, (str, bytes)): return batch elif isinstance(elem, collections.abc.Mapping): return {key: default_collate_w_pil([d[key] for d in batch]) for key in elem} elif isinstance(elem, tuple) and hasattr(elem, '_fields'): # namedtuple return elem_type(*(default_collate_w_pil(samples) for samples in zip(*batch))) elif isinstance(elem, collections.abc.Sequence): # check to make sure that the elements in batch have consistent size it = iter(batch) elem_size = len(next(it)) if not all(len(elem) == elem_size for elem in it): raise RuntimeError('each element in list of batch should be of equal size') transposed = zip(*batch) return [default_collate_w_pil(samples) for samples in transposed] elif isinstance(elem, Image): return batch raise TypeError(default_collate_err_msg_format.format(elem_type))
[docs]@register_misc_transform_module class ClearTargetTransform(nn.Module): """ A transform module that replaces target with an empty list. """ def __init__(self): super().__init__()
[docs] def forward(self, sample, *args): """ Replaces target data field with an empty list. :param sample: image or image tensor :type sample: PIL.Image.Image or torch.Tensor :return: sample and an empty list :rtype: (PIL.Image.Image or torch.Tensor, list) """ return sample, list()
[docs]@register_misc_transform_module class AdaptivePad(nn.Module): """ A transform module that adaptively determines the size of padded sample. :param fill: padded value :type fill: int :param padding_position: 'hw' (default) to pad left and right for padding horizontal size // 2 and top and bottom for padding vertical size // 2; 'right_bottom' to pad bottom and right only :type padding_position: str :param padding_mode: padding mode passed to pad module :type padding_mode: str :param factor: factor value for the padded input sample :type factor: int :param returns_org_patch_size: if True, returns the patch size of the original input :type returns_org_patch_size: bool """ def __init__(self, fill=0, padding_position='hw', padding_mode='constant', factor=128, returns_org_patch_size=False): super().__init__() self.fill = fill self.padding_position = padding_position self.padding_mode = padding_mode self.factor = factor self.returns_org_patch_size = returns_org_patch_size
[docs] def forward(self, x): """ Adaptively determines the size of padded image or image tensor. :param x: image or image tensor :type x: PIL.Image.Image or torch.Tensor :return: padded image or image tensor, and the patch size of the input (height, width) if returns_org_patch_size=True :rtype: PIL.Image.Image or torch.Tensor or (PIL.Image.Image or torch.Tensor, list[int, int]) """ height, width = x.shape[-2:] vertical_pad_size = 0 if height % self.factor == 0 else int((height // self.factor + 1) * self.factor - height) horizontal_pad_size = 0 if width % self.factor == 0 else int((width // self.factor + 1) * self.factor - width) padded_vertical_size = vertical_pad_size + height padded_horizontal_size = horizontal_pad_size + width assert padded_vertical_size % self.factor == 0 and padded_horizontal_size % self.factor == 0, \ 'padded vertical and horizontal sizes ({}, {}) should be ' \ 'factor of {}'.format(padded_vertical_size, padded_horizontal_size, self.factor) padding = [horizontal_pad_size // 2, vertical_pad_size // 2] if self.padding_position == 'equal_side' \ else [0, 0, horizontal_pad_size, vertical_pad_size] x = pad(x, padding, self.fill, self.padding_mode) if self.returns_org_patch_size: return x, (height, width) return x
[docs]@register_misc_transform_module class CustomToTensor(nn.Module): """ A customized ToTensor module that can be applied to sample and target selectively. :param converts_sample: if True, applies to_tensor to sample :type converts_sample: bool :param converts_target: if True, applies torch.as_tensor to target :type converts_target: bool """ def __init__(self, converts_sample=True, converts_target=True): super().__init__() self.converts_sample = converts_sample self.converts_target = converts_target def __call__(self, image, target): if self.converts_sample: image = F.to_tensor(image) if self.converts_target: target = torch.as_tensor(np.array(target), dtype=torch.int64) return image, target
[docs]@register_misc_transform_module class SimpleQuantizer(nn.Module): """ A module to quantize tensor with its half() function if num_bits=16 (FP16) or Jacob et al.'s method if num_bits=8 (INT8 + one FP32 scale parameter). Benoit Jacob, Skirmantas Kligys, Bo Chen, Menglong Zhu, Matthew Tang, Andrew Howard, Hartwig Adam, Dmitry Kalenichenko: `"Quantization and Training of Neural Networks for Efficient Integer-Arithmetic-Only Inference" <https://openaccess.thecvf.com/content_cvpr_2018/html/Jacob_Quantization_and_Training_CVPR_2018_paper.html>`_ @ CVPR 2018 (2018) :param num_bits: number of bits for quantization :type num_bits: int """ def __init__(self, num_bits): super().__init__() self.num_bits = num_bits
[docs] def forward(self, z): """ Quantizes tensor. :param z: tensor :type z: torch.Tensor :return: quantized tensor :rtype: torch.Tensor or torchdistill.common.tensor_util.QuantizedTensor """ return z.half() if self.num_bits == 16 else tensor_util.quantize_tensor(z, self.num_bits)
[docs]@register_misc_transform_module class SimpleDequantizer(nn.Module): """ A module to dequantize quantized tensor in FP32. If num_bits=8, it uses Jacob et al.'s method. Benoit Jacob, Skirmantas Kligys, Bo Chen, Menglong Zhu, Matthew Tang, Andrew Howard, Hartwig Adam, Dmitry Kalenichenko: `"Quantization and Training of Neural Networks for Efficient Integer-Arithmetic-Only Inference" <https://openaccess.thecvf.com/content_cvpr_2018/html/Jacob_Quantization_and_Training_CVPR_2018_paper.html>`_ @ CVPR 2018 (2018) :param num_bits: number of bits used for quantization :type num_bits: int """ def __init__(self, num_bits): super().__init__() self.num_bits = num_bits
[docs] def forward(self, z): """ Dequantizes quantized tensor. :param z: quantized tensor :type z: torch.Tensor or torchdistill.common.tensor_util.QuantizedTensor :return: dequantized tensor :rtype: torch.Tensor """ return z.float() if self.num_bits == 16 else tensor_util.dequantize_tensor(z)