Upload 372 files
This view is limited to 50 files because it contains too many changes.
- .gitattributes +2 -0
- torchvision/_C.so +3 -0
- torchvision/__init__.py +114 -0
- torchvision/__pycache__/__init__.cpython-38.pyc +0 -0
- torchvision/__pycache__/_internally_replaced_utils.cpython-38.pyc +0 -0
- torchvision/__pycache__/_utils.cpython-38.pyc +0 -0
- torchvision/__pycache__/extension.cpython-38.pyc +0 -0
- torchvision/__pycache__/utils.cpython-38.pyc +0 -0
- torchvision/__pycache__/version.cpython-38.pyc +0 -0
- torchvision/_internally_replaced_utils.py +58 -0
- torchvision/_utils.py +32 -0
- torchvision/datapoints/__init__.py +12 -0
- torchvision/datapoints/__pycache__/__init__.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_bounding_box.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_datapoint.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_dataset_wrapper.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_image.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_mask.cpython-38.pyc +0 -0
- torchvision/datapoints/__pycache__/_video.cpython-38.pyc +0 -0
- torchvision/datapoints/_bounding_box.py +237 -0
- torchvision/datapoints/_datapoint.py +259 -0
- torchvision/datapoints/_dataset_wrapper.py +499 -0
- torchvision/datapoints/_image.py +260 -0
- torchvision/datapoints/_mask.py +158 -0
- torchvision/datapoints/_video.py +250 -0
- torchvision/datasets/__init__.py +145 -0
- torchvision/datasets/__pycache__/__init__.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/_optical_flow.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/_stereo_matching.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/caltech.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/celeba.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/cifar.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/cityscapes.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/clevr.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/coco.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/country211.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/dtd.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/eurosat.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/fakedata.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/fer2013.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/fgvc_aircraft.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/flickr.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/flowers102.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/folder.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/food101.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/gtsrb.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/hmdb51.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/imagenet.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/inaturalist.cpython-38.pyc +0 -0
- torchvision/datasets/__pycache__/kinetics.cpython-38.pyc +0 -0
.gitattributes
CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+torchvision/_C.so filter=lfs diff=lfs merge=lfs -text
+torchvision/image.so filter=lfs diff=lfs merge=lfs -text

torchvision/_C.so
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1f60f9e860992a1c25bbad7efc84b2036c82da5f23c976995dbdefeab6ff5d73
size 70104344

torchvision/__init__.py
ADDED
@@ -0,0 +1,114 @@
import os
import warnings
from modulefinder import Module

import torch
from torchvision import datasets, io, models, ops, transforms, utils

from .extension import _HAS_OPS

try:
    from .version import __version__  # noqa: F401
except ImportError:
    pass


# Check if torchvision is being imported within the root folder
if not _HAS_OPS and os.path.dirname(os.path.realpath(__file__)) == os.path.join(
    os.path.realpath(os.getcwd()), "torchvision"
):
    message = (
        "You are importing torchvision within its own root folder ({}). "
        "This is not expected to work and may give errors. Please exit the "
        "torchvision project source and relaunch your python interpreter."
    )
    warnings.warn(message.format(os.getcwd()))

_image_backend = "PIL"

_video_backend = "pyav"


def set_image_backend(backend):
    """
    Specifies the package used to load images.

    Args:
        backend (string): Name of the image backend. one of {'PIL', 'accimage'}.
            The :mod:`accimage` package uses the Intel IPP library. It is
            generally faster than PIL, but does not support as many operations.
    """
    global _image_backend
    if backend not in ["PIL", "accimage"]:
        raise ValueError(f"Invalid backend '{backend}'. Options are 'PIL' and 'accimage'")
    _image_backend = backend


def get_image_backend():
    """
    Gets the name of the package used to load images
    """
    return _image_backend


def set_video_backend(backend):
    """
    Specifies the package used to decode videos.

    Args:
        backend (string): Name of the video backend. one of {'pyav', 'video_reader'}.
            The :mod:`pyav` package uses the 3rd party PyAv library. It is a Pythonic
            binding for the FFmpeg libraries.
            The :mod:`video_reader` package includes a native C++ implementation on
            top of FFMPEG libraries, and a python API of TorchScript custom operator.
            It generally decodes faster than :mod:`pyav`, but is perhaps less robust.

    .. note::
        Building with FFMPEG is disabled by default in the latest `main`. If you want to use the 'video_reader'
        backend, please compile torchvision from source.
    """
    global _video_backend
    if backend not in ["pyav", "video_reader", "cuda"]:
        raise ValueError("Invalid video backend '%s'. Options are 'pyav', 'video_reader' and 'cuda'" % backend)
    if backend == "video_reader" and not io._HAS_VIDEO_OPT:
        # TODO: better messages
        message = "video_reader video backend is not available. Please compile torchvision from source and try again"
        raise RuntimeError(message)
    elif backend == "cuda" and not io._HAS_GPU_VIDEO_DECODER:
        # TODO: better messages
        message = "cuda video backend is not available."
        raise RuntimeError(message)
    else:
        _video_backend = backend


def get_video_backend():
    """
    Returns the currently active video backend used to decode videos.

    Returns:
        str: Name of the video backend. one of {'pyav', 'video_reader'}.
    """

    return _video_backend


def _is_tracing():
    return torch._C._get_tracing_state()


_WARN_ABOUT_BETA_TRANSFORMS = True
_BETA_TRANSFORMS_WARNING = (
    "The torchvision.datapoints and torchvision.transforms.v2 namespaces are still Beta. "
    "While we do not expect major breaking changes, some APIs may still change "
    "according to user feedback. Please submit any feedback you may have in "
    "this issue: https://github.com/pytorch/vision/issues/6753, and you can also "
    "check out https://github.com/pytorch/vision/issues/7319 to learn more about "
    "the APIs that we suspect might involve future changes. "
    "You can silence this warning by calling torchvision.disable_beta_transforms_warning()."
)


def disable_beta_transforms_warning():
    global _WARN_ABOUT_BETA_TRANSFORMS
    _WARN_ABOUT_BETA_TRANSFORMS = False

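As a quick orientation for the module above, a small usage sketch of the backend helpers it defines (standard install assumed; the 'video_reader' and 'cuda' branches only succeed when torchvision was built with the corresponding support):

import torchvision

# Defaults set at import time above: PIL for images, pyav for video.
print(torchvision.get_image_backend())  # "PIL"
print(torchvision.get_video_backend())  # "pyav"

# set_image_backend validates its argument and raises ValueError otherwise.
try:
    torchvision.set_image_backend("opencv")
except ValueError as err:
    print(err)

# Silence the beta warning emitted when torchvision.datapoints is imported;
# call this before that import for it to take effect.
torchvision.disable_beta_transforms_warning()
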
torchvision/__pycache__/__init__.cpython-38.pyc
ADDED
Binary file (4.07 kB)

torchvision/__pycache__/_internally_replaced_utils.cpython-38.pyc
ADDED
Binary file (1.76 kB)

torchvision/__pycache__/_utils.cpython-38.pyc
ADDED
Binary file (1.46 kB)

torchvision/__pycache__/extension.cpython-38.pyc
ADDED
Binary file (2.93 kB)

torchvision/__pycache__/utils.cpython-38.pyc
ADDED
Binary file (18.8 kB)

torchvision/__pycache__/version.cpython-38.pyc
ADDED
Binary file (367 Bytes)

torchvision/_internally_replaced_utils.py
ADDED
@@ -0,0 +1,58 @@
import importlib.machinery
import os

from torch.hub import _get_torch_home


_HOME = os.path.join(_get_torch_home(), "datasets", "vision")
_USE_SHARDED_DATASETS = False


def _download_file_from_remote_location(fpath: str, url: str) -> None:
    pass


def _is_remote_location_available() -> bool:
    return False


try:
    from torch.hub import load_state_dict_from_url  # noqa: 401
except ImportError:
    from torch.utils.model_zoo import load_url as load_state_dict_from_url  # noqa: 401


def _get_extension_path(lib_name):

    lib_dir = os.path.dirname(__file__)
    if os.name == "nt":
        # Register the main torchvision library location on the default DLL path
        import ctypes
        import sys

        kernel32 = ctypes.WinDLL("kernel32.dll", use_last_error=True)
        with_load_library_flags = hasattr(kernel32, "AddDllDirectory")
        prev_error_mode = kernel32.SetErrorMode(0x0001)

        if with_load_library_flags:
            kernel32.AddDllDirectory.restype = ctypes.c_void_p

        if sys.version_info >= (3, 8):
            os.add_dll_directory(lib_dir)
        elif with_load_library_flags:
            res = kernel32.AddDllDirectory(lib_dir)
            if res is None:
                err = ctypes.WinError(ctypes.get_last_error())
                err.strerror += f' Error adding "{lib_dir}" to the DLL directories.'
                raise err

        kernel32.SetErrorMode(prev_error_mode)

    loader_details = (importlib.machinery.ExtensionFileLoader, importlib.machinery.EXTENSION_SUFFIXES)

    extfinder = importlib.machinery.FileFinder(lib_dir, loader_details)
    ext_specs = extfinder.find_spec(lib_name)
    if ext_specs is None:
        raise ImportError

    return ext_specs.origin

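The extension locator above is how torchvision finds its bundled native libraries (for example the image.so registered in .gitattributes). A minimal sketch, assuming the shared object ships next to the Python files; torch.ops.load_library is the standard PyTorch entry point for registering custom operators:

import torch
from torchvision._internally_replaced_utils import _get_extension_path

try:
    lib_path = _get_extension_path("image")  # resolves e.g. .../torchvision/image.so
    torch.ops.load_library(lib_path)         # registers the custom operators it contains
except (ImportError, OSError) as err:
    print(f"native image extension unavailable: {err}")
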
torchvision/_utils.py
ADDED
@@ -0,0 +1,32 @@
import enum
from typing import Sequence, Type, TypeVar

T = TypeVar("T", bound=enum.Enum)


class StrEnumMeta(enum.EnumMeta):
    auto = enum.auto

    def from_str(self: Type[T], member: str) -> T:  # type: ignore[misc]
        try:
            return self[member]
        except KeyError:
            # TODO: use `add_suggestion` from torchvision.prototype.utils._internal to improve the error message as
            # soon as it is migrated.
            raise ValueError(f"Unknown value '{member}' for {self.__name__}.") from None


class StrEnum(enum.Enum, metaclass=StrEnumMeta):
    pass


def sequence_to_str(seq: Sequence, separate_last: str = "") -> str:
    if not seq:
        return ""
    if len(seq) == 1:
        return f"'{seq[0]}'"

    head = "'" + "', '".join([str(item) for item in seq[:-1]]) + "'"
    tail = f"{'' if separate_last and len(seq) == 2 else ','} {separate_last}'{seq[-1]}'"

    return head + tail

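Since the `separate_last` handling in sequence_to_str above is easy to misread, a short sketch of its output:

from torchvision._utils import sequence_to_str

print(sequence_to_str(["cat"]))                                       # 'cat'
print(sequence_to_str(["cat", "dog"], separate_last="and "))          # 'cat' and 'dog'
print(sequence_to_str(["cat", "dog", "bird"], separate_last="and "))  # 'cat', 'dog', and 'bird'
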
torchvision/datapoints/__init__.py
ADDED
@@ -0,0 +1,12 @@
from torchvision import _BETA_TRANSFORMS_WARNING, _WARN_ABOUT_BETA_TRANSFORMS

from ._bounding_box import BoundingBox, BoundingBoxFormat
from ._datapoint import _FillType, _FillTypeJIT, _InputType, _InputTypeJIT
from ._image import _ImageType, _ImageTypeJIT, _TensorImageType, _TensorImageTypeJIT, Image
from ._mask import Mask
from ._video import _TensorVideoType, _TensorVideoTypeJIT, _VideoType, _VideoTypeJIT, Video

if _WARN_ABOUT_BETA_TRANSFORMS:
    import warnings

    warnings.warn(_BETA_TRANSFORMS_WARNING)

torchvision/datapoints/__pycache__/__init__.cpython-38.pyc
ADDED
Binary file (840 Bytes)

torchvision/datapoints/__pycache__/_bounding_box.cpython-38.pyc
ADDED
Binary file (8.02 kB)

torchvision/datapoints/__pycache__/_datapoint.cpython-38.pyc
ADDED
Binary file (10 kB)

torchvision/datapoints/__pycache__/_dataset_wrapper.cpython-38.pyc
ADDED
Binary file (16.3 kB)

torchvision/datapoints/__pycache__/_image.cpython-38.pyc
ADDED
Binary file (10.4 kB)

torchvision/datapoints/__pycache__/_mask.cpython-38.pyc
ADDED
Binary file (5.98 kB)

torchvision/datapoints/__pycache__/_video.cpython-38.pyc
ADDED
Binary file (10.1 kB)

torchvision/datapoints/_bounding_box.py
ADDED
@@ -0,0 +1,237 @@
from __future__ import annotations

from enum import Enum
from typing import Any, List, Optional, Sequence, Tuple, Union

import torch
from torchvision.transforms import InterpolationMode  # TODO: this needs to be moved out of transforms

from ._datapoint import _FillTypeJIT, Datapoint


class BoundingBoxFormat(Enum):
    """[BETA] Coordinate format of a bounding box.

    Available formats are

    * ``XYXY``
    * ``XYWH``
    * ``CXCYWH``
    """

    XYXY = "XYXY"
    XYWH = "XYWH"
    CXCYWH = "CXCYWH"


class BoundingBox(Datapoint):
    """[BETA] :class:`torch.Tensor` subclass for bounding boxes.

    Args:
        data: Any data that can be turned into a tensor with :func:`torch.as_tensor`.
        format (BoundingBoxFormat, str): Format of the bounding box.
        spatial_size (two-tuple of ints): Height and width of the corresponding image or video.
        dtype (torch.dtype, optional): Desired data type of the bounding box. If omitted, will be inferred from
            ``data``.
        device (torch.device, optional): Desired device of the bounding box. If omitted and ``data`` is a
            :class:`torch.Tensor`, the device is taken from it. Otherwise, the bounding box is constructed on the CPU.
        requires_grad (bool, optional): Whether autograd should record operations on the bounding box. If omitted and
            ``data`` is a :class:`torch.Tensor`, the value is taken from it. Otherwise, defaults to ``False``.
    """

    format: BoundingBoxFormat
    spatial_size: Tuple[int, int]

    @classmethod
    def _wrap(cls, tensor: torch.Tensor, *, format: BoundingBoxFormat, spatial_size: Tuple[int, int]) -> BoundingBox:
        bounding_box = tensor.as_subclass(cls)
        bounding_box.format = format
        bounding_box.spatial_size = spatial_size
        return bounding_box

    def __new__(
        cls,
        data: Any,
        *,
        format: Union[BoundingBoxFormat, str],
        spatial_size: Tuple[int, int],
        dtype: Optional[torch.dtype] = None,
        device: Optional[Union[torch.device, str, int]] = None,
        requires_grad: Optional[bool] = None,
    ) -> BoundingBox:
        tensor = cls._to_tensor(data, dtype=dtype, device=device, requires_grad=requires_grad)

        if isinstance(format, str):
            format = BoundingBoxFormat[format.upper()]

        return cls._wrap(tensor, format=format, spatial_size=spatial_size)

    @classmethod
    def wrap_like(
        cls,
        other: BoundingBox,
        tensor: torch.Tensor,
        *,
        format: Optional[BoundingBoxFormat] = None,
        spatial_size: Optional[Tuple[int, int]] = None,
    ) -> BoundingBox:
        """Wrap a :class:`torch.Tensor` as :class:`BoundingBox` from a reference.

        Args:
            other (BoundingBox): Reference bounding box.
            tensor (Tensor): Tensor to be wrapped as :class:`BoundingBox`
            format (BoundingBoxFormat, str, optional): Format of the bounding box. If omitted, it is taken from the
                reference.
            spatial_size (two-tuple of ints, optional): Height and width of the corresponding image or video. If
                omitted, it is taken from the reference.

        """
        if isinstance(format, str):
            format = BoundingBoxFormat[format.upper()]

        return cls._wrap(
            tensor,
            format=format if format is not None else other.format,
            spatial_size=spatial_size if spatial_size is not None else other.spatial_size,
        )

    def __repr__(self, *, tensor_contents: Any = None) -> str:  # type: ignore[override]
        return self._make_repr(format=self.format, spatial_size=self.spatial_size)

    def horizontal_flip(self) -> BoundingBox:
        output = self._F.horizontal_flip_bounding_box(
            self.as_subclass(torch.Tensor), format=self.format, spatial_size=self.spatial_size
        )
        return BoundingBox.wrap_like(self, output)

    def vertical_flip(self) -> BoundingBox:
        output = self._F.vertical_flip_bounding_box(
            self.as_subclass(torch.Tensor), format=self.format, spatial_size=self.spatial_size
        )
        return BoundingBox.wrap_like(self, output)

    def resize(  # type: ignore[override]
        self,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        max_size: Optional[int] = None,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> BoundingBox:
        output, spatial_size = self._F.resize_bounding_box(
            self.as_subclass(torch.Tensor),
            spatial_size=self.spatial_size,
            size=size,
            max_size=max_size,
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def crop(self, top: int, left: int, height: int, width: int) -> BoundingBox:
        output, spatial_size = self._F.crop_bounding_box(
            self.as_subclass(torch.Tensor), self.format, top=top, left=left, height=height, width=width
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def center_crop(self, output_size: List[int]) -> BoundingBox:
        output, spatial_size = self._F.center_crop_bounding_box(
            self.as_subclass(torch.Tensor), format=self.format, spatial_size=self.spatial_size, output_size=output_size
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def resized_crop(
        self,
        top: int,
        left: int,
        height: int,
        width: int,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> BoundingBox:
        output, spatial_size = self._F.resized_crop_bounding_box(
            self.as_subclass(torch.Tensor), self.format, top, left, height, width, size=size
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def pad(
        self,
        padding: Union[int, Sequence[int]],
        fill: Optional[Union[int, float, List[float]]] = None,
        padding_mode: str = "constant",
    ) -> BoundingBox:
        output, spatial_size = self._F.pad_bounding_box(
            self.as_subclass(torch.Tensor),
            format=self.format,
            spatial_size=self.spatial_size,
            padding=padding,
            padding_mode=padding_mode,
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def rotate(
        self,
        angle: float,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        expand: bool = False,
        center: Optional[List[float]] = None,
        fill: _FillTypeJIT = None,
    ) -> BoundingBox:
        output, spatial_size = self._F.rotate_bounding_box(
            self.as_subclass(torch.Tensor),
            format=self.format,
            spatial_size=self.spatial_size,
            angle=angle,
            expand=expand,
            center=center,
        )
        return BoundingBox.wrap_like(self, output, spatial_size=spatial_size)

    def affine(
        self,
        angle: Union[int, float],
        translate: List[float],
        scale: float,
        shear: List[float],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        center: Optional[List[float]] = None,
    ) -> BoundingBox:
        output = self._F.affine_bounding_box(
            self.as_subclass(torch.Tensor),
            self.format,
            self.spatial_size,
            angle,
            translate=translate,
            scale=scale,
            shear=shear,
            center=center,
        )
        return BoundingBox.wrap_like(self, output)

    def perspective(
        self,
        startpoints: Optional[List[List[int]]],
        endpoints: Optional[List[List[int]]],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
        coefficients: Optional[List[float]] = None,
    ) -> BoundingBox:
        output = self._F.perspective_bounding_box(
            self.as_subclass(torch.Tensor),
            format=self.format,
            spatial_size=self.spatial_size,
            startpoints=startpoints,
            endpoints=endpoints,
            coefficients=coefficients,
        )
        return BoundingBox.wrap_like(self, output)

    def elastic(
        self,
        displacement: torch.Tensor,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
    ) -> BoundingBox:
        output = self._F.elastic_bounding_box(
            self.as_subclass(torch.Tensor), self.format, self.spatial_size, displacement=displacement
        )
        return BoundingBox.wrap_like(self, output)

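A brief usage sketch of the BoundingBox datapoint defined above (coordinates and sizes are made up for illustration; assumes a build with the beta datapoints API, i.e. this upload):

import torch
from torchvision import datapoints

# Two boxes in XYXY format on an image of height 480 and width 640.
boxes = datapoints.BoundingBox(
    [[10, 20, 110, 220], [50, 50, 150, 150]],
    format=datapoints.BoundingBoxFormat.XYXY,
    spatial_size=(480, 640),
)

# The dispatch methods return new BoundingBox instances with the metadata
# carried over, or updated where the operation changes it (e.g. resize).
flipped = boxes.horizontal_flip()
resized = boxes.resize([240, 320])

print(flipped.spatial_size)  # (480, 640)
print(resized.spatial_size)  # (240, 320)
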
torchvision/datapoints/_datapoint.py
ADDED
@@ -0,0 +1,259 @@
from __future__ import annotations

from types import ModuleType
from typing import Any, Callable, List, Mapping, Optional, Sequence, Tuple, Type, TypeVar, Union

import PIL.Image
import torch
from torch._C import DisableTorchFunctionSubclass
from torch.types import _device, _dtype, _size
from torchvision.transforms import InterpolationMode


D = TypeVar("D", bound="Datapoint")
_FillType = Union[int, float, Sequence[int], Sequence[float], None]
_FillTypeJIT = Optional[List[float]]


class Datapoint(torch.Tensor):
    __F: Optional[ModuleType] = None

    @staticmethod
    def _to_tensor(
        data: Any,
        dtype: Optional[torch.dtype] = None,
        device: Optional[Union[torch.device, str, int]] = None,
        requires_grad: Optional[bool] = None,
    ) -> torch.Tensor:
        if requires_grad is None:
            requires_grad = data.requires_grad if isinstance(data, torch.Tensor) else False
        return torch.as_tensor(data, dtype=dtype, device=device).requires_grad_(requires_grad)

    @classmethod
    def wrap_like(cls: Type[D], other: D, tensor: torch.Tensor) -> D:
        raise NotImplementedError

    _NO_WRAPPING_EXCEPTIONS = {
        torch.Tensor.clone: lambda cls, input, output: cls.wrap_like(input, output),
        torch.Tensor.to: lambda cls, input, output: cls.wrap_like(input, output),
        # We don't need to wrap the output of `Tensor.requires_grad_`, since it is an inplace operation and thus
        # retains the type automatically
        torch.Tensor.requires_grad_: lambda cls, input, output: output,
    }

    @classmethod
    def __torch_function__(
        cls,
        func: Callable[..., torch.Tensor],
        types: Tuple[Type[torch.Tensor], ...],
        args: Sequence[Any] = (),
        kwargs: Optional[Mapping[str, Any]] = None,
    ) -> torch.Tensor:
        """For general information about how the __torch_function__ protocol works,
        see https://pytorch.org/docs/stable/notes/extending.html#extending-torch

        TL;DR: Every time a PyTorch operator is called, it goes through the inputs and looks for the
        ``__torch_function__`` method. If one is found, it is invoked with the operator as ``func`` as well as the
        ``args`` and ``kwargs`` of the original call.

        The default behavior of :class:`~torch.Tensor`'s is to retain a custom tensor type. For the :class:`Datapoint`
        use case, this has two downsides:

        1. Since some :class:`Datapoint`'s require metadata to be constructed, the default wrapping, i.e.
           ``return cls(func(*args, **kwargs))``, will fail for them.
        2. For most operations, there is no way of knowing if the input type is still valid for the output.

        For these reasons, the automatic output wrapping is turned off for most operators. The only exceptions are
        listed in :attr:`Datapoint._NO_WRAPPING_EXCEPTIONS`
        """
        # Since super().__torch_function__ has no hook to prevent the coercing of the output into the input type, we
        # need to reimplement the functionality.

        if not all(issubclass(cls, t) for t in types):
            return NotImplemented

        with DisableTorchFunctionSubclass():
            output = func(*args, **kwargs or dict())

            wrapper = cls._NO_WRAPPING_EXCEPTIONS.get(func)
            # Apart from `func` needing to be an exception, we also require the primary operand, i.e. `args[0]`, to be
            # an instance of the class that `__torch_function__` was invoked on. The __torch_function__ protocol will
            # invoke this method on *all* types involved in the computation by walking the MRO upwards. For example,
            # `torch.Tensor(...).to(datapoints.Image(...))` will invoke `datapoints.Image.__torch_function__` with
            # `args = (torch.Tensor(), datapoints.Image())` first. Without this guard, the original `torch.Tensor` would
            # be wrapped into a `datapoints.Image`.
            if wrapper and isinstance(args[0], cls):
                return wrapper(cls, args[0], output)

            # Inplace `func`'s, canonically identified with a trailing underscore in their name like `.add_(...)`,
            # will retain the input type. Thus, we need to unwrap here.
            if isinstance(output, cls):
                return output.as_subclass(torch.Tensor)

            return output

    def _make_repr(self, **kwargs: Any) -> str:
        # This is a poor man's implementation of the proposal in https://github.com/pytorch/pytorch/issues/76532.
        # If that ever gets implemented, remove this in favor of the solution on the `torch.Tensor` class.
        extra_repr = ", ".join(f"{key}={value}" for key, value in kwargs.items())
        return f"{super().__repr__()[:-1]}, {extra_repr})"

    @property
    def _F(self) -> ModuleType:
        # This implements a lazy import of the functional to get around the cyclic import. This import is deferred
        # until the first time we need reference to the functional module and it's shared across all instances of
        # the class. This approach avoids the DataLoader issue described at
        # https://github.com/pytorch/vision/pull/6476#discussion_r953588621
        if Datapoint.__F is None:
            from ..transforms.v2 import functional

            Datapoint.__F = functional
        return Datapoint.__F

    # Add properties for common attributes like shape, dtype, device, ndim etc
    # this way we return the result without passing into __torch_function__
    @property
    def shape(self) -> _size:  # type: ignore[override]
        with DisableTorchFunctionSubclass():
            return super().shape

    @property
    def ndim(self) -> int:  # type: ignore[override]
        with DisableTorchFunctionSubclass():
            return super().ndim

    @property
    def device(self, *args: Any, **kwargs: Any) -> _device:  # type: ignore[override]
        with DisableTorchFunctionSubclass():
            return super().device

    @property
    def dtype(self) -> _dtype:  # type: ignore[override]
        with DisableTorchFunctionSubclass():
            return super().dtype

    def horizontal_flip(self) -> Datapoint:
        return self

    def vertical_flip(self) -> Datapoint:
        return self

    # TODO: We have to ignore override mypy error as there is torch.Tensor built-in deprecated op: Tensor.resize
    # https://github.com/pytorch/pytorch/blob/e8727994eb7cdb2ab642749d6549bc497563aa06/torch/_tensor.py#L588-L593
    def resize(  # type: ignore[override]
        self,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        max_size: Optional[int] = None,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Datapoint:
        return self

    def crop(self, top: int, left: int, height: int, width: int) -> Datapoint:
        return self

    def center_crop(self, output_size: List[int]) -> Datapoint:
        return self

    def resized_crop(
        self,
        top: int,
        left: int,
        height: int,
        width: int,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Datapoint:
        return self

    def pad(
        self,
        padding: List[int],
        fill: Optional[Union[int, float, List[float]]] = None,
        padding_mode: str = "constant",
    ) -> Datapoint:
        return self

    def rotate(
        self,
        angle: float,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        expand: bool = False,
        center: Optional[List[float]] = None,
        fill: _FillTypeJIT = None,
    ) -> Datapoint:
        return self

    def affine(
        self,
        angle: Union[int, float],
        translate: List[float],
        scale: float,
        shear: List[float],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        center: Optional[List[float]] = None,
    ) -> Datapoint:
        return self

    def perspective(
        self,
        startpoints: Optional[List[List[int]]],
        endpoints: Optional[List[List[int]]],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
        coefficients: Optional[List[float]] = None,
    ) -> Datapoint:
        return self

    def elastic(
        self,
        displacement: torch.Tensor,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
    ) -> Datapoint:
        return self

    def rgb_to_grayscale(self, num_output_channels: int = 1) -> Datapoint:
        return self

    def adjust_brightness(self, brightness_factor: float) -> Datapoint:
        return self

    def adjust_saturation(self, saturation_factor: float) -> Datapoint:
        return self

    def adjust_contrast(self, contrast_factor: float) -> Datapoint:
        return self

    def adjust_sharpness(self, sharpness_factor: float) -> Datapoint:
        return self

    def adjust_hue(self, hue_factor: float) -> Datapoint:
        return self

    def adjust_gamma(self, gamma: float, gain: float = 1) -> Datapoint:
        return self

    def posterize(self, bits: int) -> Datapoint:
        return self

    def solarize(self, threshold: float) -> Datapoint:
        return self

    def autocontrast(self) -> Datapoint:
        return self

    def equalize(self) -> Datapoint:
        return self

    def invert(self) -> Datapoint:
        return self

    def gaussian_blur(self, kernel_size: List[int], sigma: Optional[List[float]] = None) -> Datapoint:
        return self


_InputType = Union[torch.Tensor, PIL.Image.Image, Datapoint]
_InputTypeJIT = torch.Tensor

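The `__torch_function__` logic above means most tensor operations on a Datapoint intentionally fall back to a plain torch.Tensor; only the ops in `_NO_WRAPPING_EXCEPTIONS` are re-wrapped. A small sketch of that behavior, using the Image subclass from this upload:

import torch
from torchvision import datapoints

img = datapoints.Image(torch.rand(3, 32, 32))

print(type(img.clone()).__name__)            # Image  (clone is an exception)
print(type(img.to(torch.float64)).__name__)  # Image  (to is an exception)
print(type(img + 1).__name__)                # Tensor (wrapping disabled for other ops)
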
torchvision/datapoints/_dataset_wrapper.py
ADDED
@@ -0,0 +1,499 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# type: ignore
|
2 |
+
|
3 |
+
from __future__ import annotations
|
4 |
+
|
5 |
+
import contextlib
|
6 |
+
from collections import defaultdict
|
7 |
+
|
8 |
+
import torch
|
9 |
+
from torch.utils.data import Dataset
|
10 |
+
|
11 |
+
from torchvision import datapoints, datasets
|
12 |
+
from torchvision.transforms.v2 import functional as F
|
13 |
+
|
14 |
+
__all__ = ["wrap_dataset_for_transforms_v2"]
|
15 |
+
|
16 |
+
|
17 |
+
def wrap_dataset_for_transforms_v2(dataset):
|
18 |
+
"""[BETA] Wrap a ``torchvision.dataset`` for usage with :mod:`torchvision.transforms.v2`.
|
19 |
+
|
20 |
+
.. v2betastatus:: wrap_dataset_for_transforms_v2 function
|
21 |
+
|
22 |
+
Example:
|
23 |
+
>>> dataset = torchvision.datasets.CocoDetection(...)
|
24 |
+
>>> dataset = wrap_dataset_for_transforms_v2(dataset)
|
25 |
+
|
26 |
+
.. note::
|
27 |
+
|
28 |
+
For now, only the most popular datasets are supported. Furthermore, the wrapper only supports dataset
|
29 |
+
configurations that are fully supported by ``torchvision.transforms.v2``. If you encounter an error prompting you
|
30 |
+
to raise an issue to ``torchvision`` for a dataset or configuration that you need, please do so.
|
31 |
+
|
32 |
+
The dataset samples are wrapped according to the description below.
|
33 |
+
|
34 |
+
Special cases:
|
35 |
+
|
36 |
+
* :class:`~torchvision.datasets.CocoDetection`: Instead of returning the target as list of dicts, the wrapper
|
37 |
+
returns a dict of lists. In addition, the key-value-pairs ``"boxes"`` (in ``XYXY`` coordinate format),
|
38 |
+
``"masks"`` and ``"labels"`` are added and wrap the data in the corresponding ``torchvision.datapoints``.
|
39 |
+
The original keys are preserved.
|
40 |
+
* :class:`~torchvision.datasets.VOCDetection`: The key-value-pairs ``"boxes"`` and ``"labels"`` are added to
|
41 |
+
the target and wrap the data in the corresponding ``torchvision.datapoints``. The original keys are
|
42 |
+
preserved.
|
43 |
+
* :class:`~torchvision.datasets.CelebA`: The target for ``target_type="bbox"`` is converted to the ``XYXY``
|
44 |
+
coordinate format and wrapped into a :class:`~torchvision.datapoints.BoundingBox` datapoint.
|
45 |
+
* :class:`~torchvision.datasets.Kitti`: Instead returning the target as list of dictsthe wrapper returns a dict
|
46 |
+
of lists. In addition, the key-value-pairs ``"boxes"`` and ``"labels"`` are added and wrap the data
|
47 |
+
in the corresponding ``torchvision.datapoints``. The original keys are preserved.
|
48 |
+
* :class:`~torchvision.datasets.OxfordIIITPet`: The target for ``target_type="segmentation"`` is wrapped into a
|
49 |
+
:class:`~torchvision.datapoints.Mask` datapoint.
|
50 |
+
* :class:`~torchvision.datasets.Cityscapes`: The target for ``target_type="semantic"`` is wrapped into a
|
51 |
+
:class:`~torchvision.datapoints.Mask` datapoint. The target for ``target_type="instance"`` is *replaced* by
|
52 |
+
a dictionary with the key-value-pairs ``"masks"`` (as :class:`~torchvision.datapoints.Mask` datapoint) and
|
53 |
+
``"labels"``.
|
54 |
+
* :class:`~torchvision.datasets.WIDERFace`: The value for key ``"bbox"`` in the target is converted to ``XYXY``
|
55 |
+
coordinate format and wrapped into a :class:`~torchvision.datapoints.BoundingBox` datapoint.
|
56 |
+
|
57 |
+
Image classification datasets
|
58 |
+
|
59 |
+
This wrapper is a no-op for image classification datasets, since they were already fully supported by
|
60 |
+
:mod:`torchvision.transforms` and thus no change is needed for :mod:`torchvision.transforms.v2`.
|
61 |
+
|
62 |
+
Segmentation datasets
|
63 |
+
|
64 |
+
Segmentation datasets, e.g. :class:`~torchvision.datasets.VOCSegmentation` return a two-tuple of
|
65 |
+
:class:`PIL.Image.Image`'s. This wrapper leaves the image as is (first item), while wrapping the
|
66 |
+
segmentation mask into a :class:`~torchvision.datapoints.Mask` (second item).
|
67 |
+
|
68 |
+
Video classification datasets
|
69 |
+
|
70 |
+
Video classification datasets, e.g. :class:`~torchvision.datasets.Kinetics` return a three-tuple containing a
|
71 |
+
:class:`torch.Tensor` for the video and audio and a :class:`int` as label. This wrapper wraps the video into a
|
72 |
+
:class:`~torchvision.datapoints.Video` while leaving the other items as is.
|
73 |
+
|
74 |
+
.. note::
|
75 |
+
|
76 |
+
Only datasets constructed with ``output_format="TCHW"`` are supported, since the alternative
|
77 |
+
``output_format="THWC"`` is not supported by :mod:`torchvision.transforms.v2`.
|
78 |
+
|
79 |
+
Args:
|
80 |
+
dataset: the dataset instance to wrap for compatibility with transforms v2.
|
81 |
+
"""
|
82 |
+
return VisionDatasetDatapointWrapper(dataset)
|
83 |
+
|
84 |
+
|
85 |
+
class WrapperFactories(dict):
|
86 |
+
def register(self, dataset_cls):
|
87 |
+
def decorator(wrapper_factory):
|
88 |
+
self[dataset_cls] = wrapper_factory
|
89 |
+
return wrapper_factory
|
90 |
+
|
91 |
+
return decorator
|
92 |
+
|
93 |
+
|
94 |
+
# We need this two-stage design, i.e. a wrapper factory producing the actual wrapper, since some wrappers depend on the
|
95 |
+
# dataset instance rather than just the class, since they require the user defined instance attributes. Thus, we can
|
96 |
+
# provide a wrapping from the dataset class to the factory here, but can only instantiate the wrapper at runtime when
|
97 |
+
# we have access to the dataset instance.
|
98 |
+
WRAPPER_FACTORIES = WrapperFactories()
|
99 |
+
|
100 |
+
|
101 |
+
class VisionDatasetDatapointWrapper(Dataset):
|
102 |
+
def __init__(self, dataset):
|
103 |
+
dataset_cls = type(dataset)
|
104 |
+
|
105 |
+
if not isinstance(dataset, datasets.VisionDataset):
|
106 |
+
raise TypeError(
|
107 |
+
f"This wrapper is meant for subclasses of `torchvision.datasets.VisionDataset`, "
|
108 |
+
f"but got a '{dataset_cls.__name__}' instead."
|
109 |
+
)
|
110 |
+
|
111 |
+
for cls in dataset_cls.mro():
|
112 |
+
if cls in WRAPPER_FACTORIES:
|
113 |
+
wrapper_factory = WRAPPER_FACTORIES[cls]
|
114 |
+
break
|
115 |
+
elif cls is datasets.VisionDataset:
|
116 |
+
# TODO: If we have documentation on how to do that, put a link in the error message.
|
117 |
+
msg = f"No wrapper exists for dataset class {dataset_cls.__name__}. Please wrap the output yourself."
|
118 |
+
if dataset_cls in datasets.__dict__.values():
|
119 |
+
msg = (
|
120 |
+
f"{msg} If an automated wrapper for this dataset would be useful for you, "
|
121 |
+
f"please open an issue at https://github.com/pytorch/vision/issues."
|
122 |
+
)
|
123 |
+
raise TypeError(msg)
|
124 |
+
|
125 |
+
self._dataset = dataset
|
126 |
+
self._wrapper = wrapper_factory(dataset)
|
127 |
+
|
128 |
+
# We need to disable the transforms on the dataset here to be able to inject the wrapping before we apply them.
|
129 |
+
# Although internally, `datasets.VisionDataset` merges `transform` and `target_transform` into the joint
|
130 |
+
# `transforms`
|
131 |
+
# https://github.com/pytorch/vision/blob/135a0f9ea9841b6324b4fe8974e2543cbb95709a/torchvision/datasets/vision.py#L52-L54
|
132 |
+
# some (if not most) datasets still use `transform` and `target_transform` individually. Thus, we need to
|
133 |
+
# disable all three here to be able to extract the untransformed sample to wrap.
|
134 |
+
self.transform, dataset.transform = dataset.transform, None
|
135 |
+
self.target_transform, dataset.target_transform = dataset.target_transform, None
|
136 |
+
self.transforms, dataset.transforms = dataset.transforms, None
|
137 |
+
|
138 |
+
def __getattr__(self, item):
|
139 |
+
with contextlib.suppress(AttributeError):
|
140 |
+
return object.__getattribute__(self, item)
|
141 |
+
|
142 |
+
return getattr(self._dataset, item)
|
143 |
+
|
144 |
+
def __getitem__(self, idx):
|
145 |
+
# This gets us the raw sample since we disabled the transforms for the underlying dataset in the constructor
|
146 |
+
# of this class
|
147 |
+
sample = self._dataset[idx]
|
148 |
+
|
149 |
+
sample = self._wrapper(idx, sample)
|
150 |
+
|
151 |
+
# Regardless of whether the user has supplied the transforms individually (`transform` and `target_transform`)
|
152 |
+
# or joint (`transforms`), we can access the full functionality through `transforms`
|
153 |
+
if self.transforms is not None:
|
154 |
+
sample = self.transforms(*sample)
|
155 |
+
|
156 |
+
return sample
|
157 |
+
|
158 |
+
def __len__(self):
|
159 |
+
return len(self._dataset)
|
160 |
+
|
161 |
+
|
162 |
+
def raise_not_supported(description):
|
163 |
+
raise RuntimeError(
|
164 |
+
f"{description} is currently not supported by this wrapper. "
|
165 |
+
f"If this would be helpful for you, please open an issue at https://github.com/pytorch/vision/issues."
|
166 |
+
)
|
167 |
+
|
168 |
+
|
169 |
+
def identity(item):
|
170 |
+
return item
|
171 |
+
|
172 |
+
|
173 |
+
def identity_wrapper_factory(dataset):
|
174 |
+
def wrapper(idx, sample):
|
175 |
+
return sample
|
176 |
+
|
177 |
+
return wrapper
|
178 |
+
|
179 |
+
|
180 |
+
def pil_image_to_mask(pil_image):
|
181 |
+
return datapoints.Mask(pil_image)
|
182 |
+
|
183 |
+
|
184 |
+
def list_of_dicts_to_dict_of_lists(list_of_dicts):
|
185 |
+
dict_of_lists = defaultdict(list)
|
186 |
+
for dct in list_of_dicts:
|
187 |
+
for key, value in dct.items():
|
188 |
+
dict_of_lists[key].append(value)
|
189 |
+
return dict(dict_of_lists)
|
190 |
+
|
191 |
+
|
192 |
+
def wrap_target_by_type(target, *, target_types, type_wrappers):
|
193 |
+
if not isinstance(target, (tuple, list)):
|
194 |
+
target = [target]
|
195 |
+
|
196 |
+
wrapped_target = tuple(
|
197 |
+
type_wrappers.get(target_type, identity)(item) for target_type, item in zip(target_types, target)
|
198 |
+
)
|
199 |
+
|
200 |
+
if len(wrapped_target) == 1:
|
201 |
+
wrapped_target = wrapped_target[0]
|
202 |
+
|
203 |
+
return wrapped_target
|
204 |
+
|
205 |
+
|
206 |
+
def classification_wrapper_factory(dataset):
|
207 |
+
return identity_wrapper_factory(dataset)
|
208 |
+
|
209 |
+
|
210 |
+
for dataset_cls in [
|
211 |
+
datasets.Caltech256,
|
212 |
+
datasets.CIFAR10,
|
213 |
+
datasets.CIFAR100,
|
214 |
+
datasets.ImageNet,
|
215 |
+
datasets.MNIST,
|
216 |
+
datasets.FashionMNIST,
|
217 |
+
datasets.GTSRB,
|
218 |
+
datasets.DatasetFolder,
|
219 |
+
datasets.ImageFolder,
|
220 |
+
]:
|
221 |
+
WRAPPER_FACTORIES.register(dataset_cls)(classification_wrapper_factory)
|
222 |
+
|
223 |
+
|
224 |
+
def segmentation_wrapper_factory(dataset):
|
225 |
+
def wrapper(idx, sample):
|
226 |
+
image, mask = sample
|
227 |
+
return image, pil_image_to_mask(mask)
|
228 |
+
|
229 |
+
return wrapper
|
230 |
+
|
231 |
+
|
232 |
+
for dataset_cls in [
|
233 |
+
datasets.VOCSegmentation,
|
234 |
+
]:
|
235 |
+
WRAPPER_FACTORIES.register(dataset_cls)(segmentation_wrapper_factory)
|
236 |
+
|
237 |
+
|
238 |
+
def video_classification_wrapper_factory(dataset):
|
239 |
+
if dataset.video_clips.output_format == "THWC":
|
240 |
+
raise RuntimeError(
|
241 |
+
f"{type(dataset).__name__} with `output_format='THWC'` is not supported by this wrapper, "
|
242 |
+
f"since it is not compatible with the transformations. Please use `output_format='TCHW'` instead."
|
243 |
+
)
|
244 |
+
|
245 |
+
def wrapper(idx, sample):
|
246 |
+
video, audio, label = sample
|
247 |
+
|
248 |
+
video = datapoints.Video(video)
|
249 |
+
|
250 |
+
return video, audio, label
|
251 |
+
|
252 |
+
return wrapper
|
253 |
+
|
254 |
+
|
255 |
+
for dataset_cls in [
|
256 |
+
datasets.HMDB51,
|
257 |
+
datasets.Kinetics,
|
258 |
+
datasets.UCF101,
|
259 |
+
]:
|
260 |
+
WRAPPER_FACTORIES.register(dataset_cls)(video_classification_wrapper_factory)
|
261 |
+
|
262 |
+
|
263 |
+
@WRAPPER_FACTORIES.register(datasets.Caltech101)
|
264 |
+
def caltech101_wrapper_factory(dataset):
|
265 |
+
if "annotation" in dataset.target_type:
|
266 |
+
raise_not_supported("Caltech101 dataset with `target_type=['annotation', ...]`")
|
267 |
+
|
268 |
+
return classification_wrapper_factory(dataset)
|
269 |
+
|
270 |
+
|
271 |
+
@WRAPPER_FACTORIES.register(datasets.CocoDetection)
|
272 |
+
def coco_dectection_wrapper_factory(dataset):
|
273 |
+
def segmentation_to_mask(segmentation, *, spatial_size):
|
274 |
+
from pycocotools import mask
|
275 |
+
|
276 |
+
segmentation = (
|
277 |
+
mask.frPyObjects(segmentation, *spatial_size)
|
278 |
+
if isinstance(segmentation, dict)
|
279 |
+
else mask.merge(mask.frPyObjects(segmentation, *spatial_size))
|
280 |
+
)
|
281 |
+
return torch.from_numpy(mask.decode(segmentation))
|
282 |
+
|
283 |
+
def wrapper(idx, sample):
|
284 |
+
image_id = dataset.ids[idx]
|
285 |
+
|
286 |
+
image, target = sample
|
287 |
+
|
288 |
+
if not target:
|
289 |
+
return image, dict(image_id=image_id)
|
290 |
+
|
291 |
+
batched_target = list_of_dicts_to_dict_of_lists(target)
|
292 |
+
|
293 |
+
batched_target["image_id"] = image_id
|
294 |
+
|
295 |
+
spatial_size = tuple(F.get_spatial_size(image))
|
296 |
+
batched_target["boxes"] = F.convert_format_bounding_box(
|
297 |
+
datapoints.BoundingBox(
|
298 |
+
batched_target["bbox"],
|
299 |
+
format=datapoints.BoundingBoxFormat.XYWH,
|
300 |
+
spatial_size=spatial_size,
|
301 |
+
),
|
302 |
+
new_format=datapoints.BoundingBoxFormat.XYXY,
|
303 |
+
)
|
304 |
+
batched_target["masks"] = datapoints.Mask(
|
305 |
+
torch.stack(
|
306 |
+
[
|
307 |
+
segmentation_to_mask(segmentation, spatial_size=spatial_size)
|
308 |
+
for segmentation in batched_target["segmentation"]
|
309 |
+
]
|
310 |
+
),
|
311 |
+
)
|
312 |
+
batched_target["labels"] = torch.tensor(batched_target["category_id"])
|
313 |
+
|
314 |
+
return image, batched_target
|
315 |
+
|
316 |
+
return wrapper
|
317 |
+
|
318 |
+
|
319 |
+
WRAPPER_FACTORIES.register(datasets.CocoCaptions)(identity_wrapper_factory)
|
320 |
+
|
321 |
+
|
322 |
+
VOC_DETECTION_CATEGORIES = [
|
323 |
+
"__background__",
|
324 |
+
"aeroplane",
|
325 |
+
"bicycle",
|
326 |
+
"bird",
|
327 |
+
"boat",
|
328 |
+
"bottle",
|
329 |
+
"bus",
|
330 |
+
"car",
|
331 |
+
"cat",
|
332 |
+
"chair",
|
333 |
+
"cow",
|
334 |
+
"diningtable",
|
335 |
+
"dog",
|
336 |
+
"horse",
|
337 |
+
"motorbike",
|
338 |
+
"person",
|
339 |
+
"pottedplant",
|
340 |
+
"sheep",
|
341 |
+
"sofa",
|
342 |
+
"train",
|
343 |
+
"tvmonitor",
|
344 |
+
]
|
345 |
+
VOC_DETECTION_CATEGORY_TO_IDX = dict(zip(VOC_DETECTION_CATEGORIES, range(len(VOC_DETECTION_CATEGORIES))))
|
346 |
+
|
347 |
+
@WRAPPER_FACTORIES.register(datasets.VOCDetection)
def voc_detection_wrapper_factory(dataset):
    def wrapper(idx, sample):
        image, target = sample

        batched_instances = list_of_dicts_to_dict_of_lists(target["annotation"]["object"])

        target["boxes"] = datapoints.BoundingBox(
            [
                [int(bndbox[part]) for part in ("xmin", "ymin", "xmax", "ymax")]
                for bndbox in batched_instances["bndbox"]
            ],
            format=datapoints.BoundingBoxFormat.XYXY,
            spatial_size=(image.height, image.width),
        )
        target["labels"] = torch.tensor(
            [VOC_DETECTION_CATEGORY_TO_IDX[category] for category in batched_instances["name"]]
        )

        return image, target

    return wrapper


@WRAPPER_FACTORIES.register(datasets.SBDataset)
def sbd_wrapper(dataset):
    if dataset.mode == "boundaries":
        raise_not_supported("SBDataset with mode='boundaries'")

    return segmentation_wrapper_factory(dataset)


@WRAPPER_FACTORIES.register(datasets.CelebA)
def celeba_wrapper_factory(dataset):
    if any(target_type in dataset.target_type for target_type in ["attr", "landmarks"]):
        raise_not_supported("`CelebA` dataset with `target_type=['attr', 'landmarks', ...]`")

    def wrapper(idx, sample):
        image, target = sample

        target = wrap_target_by_type(
            target,
            target_types=dataset.target_type,
            type_wrappers={
                "bbox": lambda item: F.convert_format_bounding_box(
                    datapoints.BoundingBox(
                        item,
                        format=datapoints.BoundingBoxFormat.XYWH,
                        spatial_size=(image.height, image.width),
                    ),
                    new_format=datapoints.BoundingBoxFormat.XYXY,
                ),
            },
        )

        return image, target

    return wrapper


KITTI_CATEGORIES = ["Car", "Van", "Truck", "Pedestrian", "Person_sitting", "Cyclist", "Tram", "Misc", "DontCare"]
KITTI_CATEGORY_TO_IDX = dict(zip(KITTI_CATEGORIES, range(len(KITTI_CATEGORIES))))


@WRAPPER_FACTORIES.register(datasets.Kitti)
def kitti_wrapper_factory(dataset):
    def wrapper(idx, sample):
        image, target = sample

        if target is not None:
            target = list_of_dicts_to_dict_of_lists(target)

            target["boxes"] = datapoints.BoundingBox(
                target["bbox"], format=datapoints.BoundingBoxFormat.XYXY, spatial_size=(image.height, image.width)
            )
            target["labels"] = torch.tensor([KITTI_CATEGORY_TO_IDX[category] for category in target["type"]])

        return image, target

    return wrapper


@WRAPPER_FACTORIES.register(datasets.OxfordIIITPet)
def oxford_iiit_pet_wrapper_factor(dataset):
    def wrapper(idx, sample):
        image, target = sample

        if target is not None:
            target = wrap_target_by_type(
                target,
                target_types=dataset._target_types,
                type_wrappers={
                    "segmentation": pil_image_to_mask,
                },
            )

        return image, target

    return wrapper


@WRAPPER_FACTORIES.register(datasets.Cityscapes)
def cityscapes_wrapper_factory(dataset):
    if any(target_type in dataset.target_type for target_type in ["polygon", "color"]):
        raise_not_supported("`Cityscapes` dataset with `target_type=['polygon', 'color', ...]`")

    def instance_segmentation_wrapper(mask):
        # See https://github.com/mcordts/cityscapesScripts/blob/8da5dd00c9069058ccc134654116aac52d4f6fa2/cityscapesscripts/preparation/json2instanceImg.py#L7-L21
        data = pil_image_to_mask(mask)
        masks = []
        labels = []
        for id in data.unique():
            masks.append(data == id)
            label = id
            if label >= 1_000:
                label //= 1_000
            labels.append(label)
        return dict(masks=datapoints.Mask(torch.stack(masks)), labels=torch.stack(labels))

    def wrapper(idx, sample):
        image, target = sample

        target = wrap_target_by_type(
            target,
            target_types=dataset.target_type,
            type_wrappers={
                "instance": instance_segmentation_wrapper,
                "semantic": pil_image_to_mask,
            },
        )

        return image, target

    return wrapper


@WRAPPER_FACTORIES.register(datasets.WIDERFace)
def widerface_wrapper(dataset):
    def wrapper(idx, sample):
        image, target = sample

        if target is not None:
            target["bbox"] = F.convert_format_bounding_box(
                datapoints.BoundingBox(
                    target["bbox"], format=datapoints.BoundingBoxFormat.XYWH, spatial_size=(image.height, image.width)
                ),
                new_format=datapoints.BoundingBoxFormat.XYXY,
            )

        return image, target

    return wrapper
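A minimal, hedged usage sketch of the wrapper factories above: they are not called directly but looked up by wrap_dataset_for_transforms_v2 (re-exported from torchvision.datasets further below), which returns a dataset whose detection targets carry datapoints.BoundingBox boxes and label tensors. The dataset root path is a placeholder.

# Sketch: consuming the VOCDetection wrapper factory registered above.
from torchvision import datasets
from torchvision.datasets import wrap_dataset_for_transforms_v2

voc = datasets.VOCDetection("path/to/voc-root", year="2012", image_set="val")
voc = wrap_dataset_for_transforms_v2(voc)

image, target = voc[0]
print(type(target["boxes"]))   # datapoints.BoundingBox, XYXY format
print(target["labels"])        # tensor of VOC category indices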
torchvision/datapoints/_image.py
ADDED
@@ -0,0 +1,260 @@
from __future__ import annotations

from typing import Any, List, Optional, Tuple, Union

import PIL.Image
import torch
from torchvision.transforms.functional import InterpolationMode

from ._datapoint import _FillTypeJIT, Datapoint


class Image(Datapoint):
    """[BETA] :class:`torch.Tensor` subclass for images.

    Args:
        data (tensor-like, PIL.Image.Image): Any data that can be turned into a tensor with :func:`torch.as_tensor` as
            well as PIL images.
        dtype (torch.dtype, optional): Desired data type of the image. If omitted, will be inferred from
            ``data``.
        device (torch.device, optional): Desired device of the image. If omitted and ``data`` is a
            :class:`torch.Tensor`, the device is taken from it. Otherwise, the image is constructed on the CPU.
        requires_grad (bool, optional): Whether autograd should record operations on the image. If omitted and
            ``data`` is a :class:`torch.Tensor`, the value is taken from it. Otherwise, defaults to ``False``.
    """

    @classmethod
    def _wrap(cls, tensor: torch.Tensor) -> Image:
        image = tensor.as_subclass(cls)
        return image

    def __new__(
        cls,
        data: Any,
        *,
        dtype: Optional[torch.dtype] = None,
        device: Optional[Union[torch.device, str, int]] = None,
        requires_grad: Optional[bool] = None,
    ) -> Image:
        if isinstance(data, PIL.Image.Image):
            from torchvision.transforms.v2 import functional as F

            data = F.pil_to_tensor(data)

        tensor = cls._to_tensor(data, dtype=dtype, device=device, requires_grad=requires_grad)
        if tensor.ndim < 2:
            raise ValueError
        elif tensor.ndim == 2:
            tensor = tensor.unsqueeze(0)

        return cls._wrap(tensor)

    @classmethod
    def wrap_like(cls, other: Image, tensor: torch.Tensor) -> Image:
        return cls._wrap(tensor)

    def __repr__(self, *, tensor_contents: Any = None) -> str:  # type: ignore[override]
        return self._make_repr()

    @property
    def spatial_size(self) -> Tuple[int, int]:
        return tuple(self.shape[-2:])  # type: ignore[return-value]

    @property
    def num_channels(self) -> int:
        return self.shape[-3]

    def horizontal_flip(self) -> Image:
        output = self._F.horizontal_flip_image_tensor(self.as_subclass(torch.Tensor))
        return Image.wrap_like(self, output)

    def vertical_flip(self) -> Image:
        output = self._F.vertical_flip_image_tensor(self.as_subclass(torch.Tensor))
        return Image.wrap_like(self, output)

    def resize(  # type: ignore[override]
        self,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        max_size: Optional[int] = None,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Image:
        output = self._F.resize_image_tensor(
            self.as_subclass(torch.Tensor), size, interpolation=interpolation, max_size=max_size, antialias=antialias
        )
        return Image.wrap_like(self, output)

    def crop(self, top: int, left: int, height: int, width: int) -> Image:
        output = self._F.crop_image_tensor(self.as_subclass(torch.Tensor), top, left, height, width)
        return Image.wrap_like(self, output)

    def center_crop(self, output_size: List[int]) -> Image:
        output = self._F.center_crop_image_tensor(self.as_subclass(torch.Tensor), output_size=output_size)
        return Image.wrap_like(self, output)

    def resized_crop(
        self,
        top: int,
        left: int,
        height: int,
        width: int,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Image:
        output = self._F.resized_crop_image_tensor(
            self.as_subclass(torch.Tensor),
            top,
            left,
            height,
            width,
            size=list(size),
            interpolation=interpolation,
            antialias=antialias,
        )
        return Image.wrap_like(self, output)

    def pad(
        self,
        padding: List[int],
        fill: Optional[Union[int, float, List[float]]] = None,
        padding_mode: str = "constant",
    ) -> Image:
        output = self._F.pad_image_tensor(self.as_subclass(torch.Tensor), padding, fill=fill, padding_mode=padding_mode)
        return Image.wrap_like(self, output)

    def rotate(
        self,
        angle: float,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        expand: bool = False,
        center: Optional[List[float]] = None,
        fill: _FillTypeJIT = None,
    ) -> Image:
        output = self._F.rotate_image_tensor(
            self.as_subclass(torch.Tensor), angle, interpolation=interpolation, expand=expand, fill=fill, center=center
        )
        return Image.wrap_like(self, output)

    def affine(
        self,
        angle: Union[int, float],
        translate: List[float],
        scale: float,
        shear: List[float],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        center: Optional[List[float]] = None,
    ) -> Image:
        output = self._F.affine_image_tensor(
            self.as_subclass(torch.Tensor),
            angle,
            translate=translate,
            scale=scale,
            shear=shear,
            interpolation=interpolation,
            fill=fill,
            center=center,
        )
        return Image.wrap_like(self, output)

    def perspective(
        self,
        startpoints: Optional[List[List[int]]],
        endpoints: Optional[List[List[int]]],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
        coefficients: Optional[List[float]] = None,
    ) -> Image:
        output = self._F.perspective_image_tensor(
            self.as_subclass(torch.Tensor),
            startpoints,
            endpoints,
            interpolation=interpolation,
            fill=fill,
            coefficients=coefficients,
        )
        return Image.wrap_like(self, output)

    def elastic(
        self,
        displacement: torch.Tensor,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
    ) -> Image:
        output = self._F.elastic_image_tensor(
            self.as_subclass(torch.Tensor), displacement, interpolation=interpolation, fill=fill
        )
        return Image.wrap_like(self, output)

    def rgb_to_grayscale(self, num_output_channels: int = 1) -> Image:
        output = self._F.rgb_to_grayscale_image_tensor(
            self.as_subclass(torch.Tensor), num_output_channels=num_output_channels
        )
        return Image.wrap_like(self, output)

    def adjust_brightness(self, brightness_factor: float) -> Image:
        output = self._F.adjust_brightness_image_tensor(
            self.as_subclass(torch.Tensor), brightness_factor=brightness_factor
        )
        return Image.wrap_like(self, output)

    def adjust_saturation(self, saturation_factor: float) -> Image:
        output = self._F.adjust_saturation_image_tensor(
            self.as_subclass(torch.Tensor), saturation_factor=saturation_factor
        )
        return Image.wrap_like(self, output)

    def adjust_contrast(self, contrast_factor: float) -> Image:
        output = self._F.adjust_contrast_image_tensor(self.as_subclass(torch.Tensor), contrast_factor=contrast_factor)
        return Image.wrap_like(self, output)

    def adjust_sharpness(self, sharpness_factor: float) -> Image:
        output = self._F.adjust_sharpness_image_tensor(
            self.as_subclass(torch.Tensor), sharpness_factor=sharpness_factor
        )
        return Image.wrap_like(self, output)

    def adjust_hue(self, hue_factor: float) -> Image:
        output = self._F.adjust_hue_image_tensor(self.as_subclass(torch.Tensor), hue_factor=hue_factor)
        return Image.wrap_like(self, output)

    def adjust_gamma(self, gamma: float, gain: float = 1) -> Image:
        output = self._F.adjust_gamma_image_tensor(self.as_subclass(torch.Tensor), gamma=gamma, gain=gain)
        return Image.wrap_like(self, output)

    def posterize(self, bits: int) -> Image:
        output = self._F.posterize_image_tensor(self.as_subclass(torch.Tensor), bits=bits)
        return Image.wrap_like(self, output)

    def solarize(self, threshold: float) -> Image:
        output = self._F.solarize_image_tensor(self.as_subclass(torch.Tensor), threshold=threshold)
        return Image.wrap_like(self, output)

    def autocontrast(self) -> Image:
        output = self._F.autocontrast_image_tensor(self.as_subclass(torch.Tensor))
        return Image.wrap_like(self, output)

    def equalize(self) -> Image:
        output = self._F.equalize_image_tensor(self.as_subclass(torch.Tensor))
        return Image.wrap_like(self, output)

    def invert(self) -> Image:
        output = self._F.invert_image_tensor(self.as_subclass(torch.Tensor))
        return Image.wrap_like(self, output)

    def gaussian_blur(self, kernel_size: List[int], sigma: Optional[List[float]] = None) -> Image:
        output = self._F.gaussian_blur_image_tensor(
            self.as_subclass(torch.Tensor), kernel_size=kernel_size, sigma=sigma
        )
        return Image.wrap_like(self, output)

    def normalize(self, mean: List[float], std: List[float], inplace: bool = False) -> Image:
        output = self._F.normalize_image_tensor(self.as_subclass(torch.Tensor), mean=mean, std=std, inplace=inplace)
        return Image.wrap_like(self, output)


_ImageType = Union[torch.Tensor, PIL.Image.Image, Image]
_ImageTypeJIT = torch.Tensor
_TensorImageType = Union[torch.Tensor, Image]
_TensorImageTypeJIT = torch.Tensor
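A short, hedged usage sketch of the class above (the random data is illustrative only): wrapping a plain tensor or PIL image in Image keeps the subclass through the tensor-returning transform methods.

# Sketch: constructing a datapoints.Image and exercising a few of its methods.
import torch
from torchvision import datapoints

img = datapoints.Image(torch.rand(3, 240, 320))    # CHW float tensor
print(img.spatial_size, img.num_channels)          # (240, 320) 3

out = img.resize([120, 160]).horizontal_flip()
print(type(out), out.spatial_size)                 # still an Image, (120, 160)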
torchvision/datapoints/_mask.py
ADDED
@@ -0,0 +1,158 @@
from __future__ import annotations

from typing import Any, List, Optional, Tuple, Union

import PIL.Image
import torch
from torchvision.transforms import InterpolationMode

from ._datapoint import _FillTypeJIT, Datapoint


class Mask(Datapoint):
    """[BETA] :class:`torch.Tensor` subclass for segmentation and detection masks.

    Args:
        data (tensor-like, PIL.Image.Image): Any data that can be turned into a tensor with :func:`torch.as_tensor` as
            well as PIL images.
        dtype (torch.dtype, optional): Desired data type of the mask. If omitted, will be inferred from
            ``data``.
        device (torch.device, optional): Desired device of the mask. If omitted and ``data`` is a
            :class:`torch.Tensor`, the device is taken from it. Otherwise, the mask is constructed on the CPU.
        requires_grad (bool, optional): Whether autograd should record operations on the mask. If omitted and
            ``data`` is a :class:`torch.Tensor`, the value is taken from it. Otherwise, defaults to ``False``.
    """

    @classmethod
    def _wrap(cls, tensor: torch.Tensor) -> Mask:
        return tensor.as_subclass(cls)

    def __new__(
        cls,
        data: Any,
        *,
        dtype: Optional[torch.dtype] = None,
        device: Optional[Union[torch.device, str, int]] = None,
        requires_grad: Optional[bool] = None,
    ) -> Mask:
        if isinstance(data, PIL.Image.Image):
            from torchvision.transforms.v2 import functional as F

            data = F.pil_to_tensor(data)

        tensor = cls._to_tensor(data, dtype=dtype, device=device, requires_grad=requires_grad)
        return cls._wrap(tensor)

    @classmethod
    def wrap_like(
        cls,
        other: Mask,
        tensor: torch.Tensor,
    ) -> Mask:
        return cls._wrap(tensor)

    @property
    def spatial_size(self) -> Tuple[int, int]:
        return tuple(self.shape[-2:])  # type: ignore[return-value]

    def horizontal_flip(self) -> Mask:
        output = self._F.horizontal_flip_mask(self.as_subclass(torch.Tensor))
        return Mask.wrap_like(self, output)

    def vertical_flip(self) -> Mask:
        output = self._F.vertical_flip_mask(self.as_subclass(torch.Tensor))
        return Mask.wrap_like(self, output)

    def resize(  # type: ignore[override]
        self,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        max_size: Optional[int] = None,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Mask:
        output = self._F.resize_mask(self.as_subclass(torch.Tensor), size, max_size=max_size)
        return Mask.wrap_like(self, output)

    def crop(self, top: int, left: int, height: int, width: int) -> Mask:
        output = self._F.crop_mask(self.as_subclass(torch.Tensor), top, left, height, width)
        return Mask.wrap_like(self, output)

    def center_crop(self, output_size: List[int]) -> Mask:
        output = self._F.center_crop_mask(self.as_subclass(torch.Tensor), output_size=output_size)
        return Mask.wrap_like(self, output)

    def resized_crop(
        self,
        top: int,
        left: int,
        height: int,
        width: int,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Mask:
        output = self._F.resized_crop_mask(self.as_subclass(torch.Tensor), top, left, height, width, size=size)
        return Mask.wrap_like(self, output)

    def pad(
        self,
        padding: List[int],
        fill: Optional[Union[int, float, List[float]]] = None,
        padding_mode: str = "constant",
    ) -> Mask:
        output = self._F.pad_mask(self.as_subclass(torch.Tensor), padding, padding_mode=padding_mode, fill=fill)
        return Mask.wrap_like(self, output)

    def rotate(
        self,
        angle: float,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        expand: bool = False,
        center: Optional[List[float]] = None,
        fill: _FillTypeJIT = None,
    ) -> Mask:
        output = self._F.rotate_mask(self.as_subclass(torch.Tensor), angle, expand=expand, center=center, fill=fill)
        return Mask.wrap_like(self, output)

    def affine(
        self,
        angle: Union[int, float],
        translate: List[float],
        scale: float,
        shear: List[float],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        center: Optional[List[float]] = None,
    ) -> Mask:
        output = self._F.affine_mask(
            self.as_subclass(torch.Tensor),
            angle,
            translate=translate,
            scale=scale,
            shear=shear,
            fill=fill,
            center=center,
        )
        return Mask.wrap_like(self, output)

    def perspective(
        self,
        startpoints: Optional[List[List[int]]],
        endpoints: Optional[List[List[int]]],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        coefficients: Optional[List[float]] = None,
    ) -> Mask:
        output = self._F.perspective_mask(
            self.as_subclass(torch.Tensor), startpoints, endpoints, fill=fill, coefficients=coefficients
        )
        return Mask.wrap_like(self, output)

    def elastic(
        self,
        displacement: torch.Tensor,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
    ) -> Mask:
        output = self._F.elastic_mask(self.as_subclass(torch.Tensor), displacement, fill=fill)
        return Mask.wrap_like(self, output)
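A hedged sketch of typical Mask usage (the random label map is invented for illustration): the geometric methods above intentionally ignore the interpolation argument and stay nearest-neighbour, so integer class indices are never blended.

# Sketch: a Mask of integer class indices keeps hard labels through resize.
import torch
from torchvision import datapoints

mask = datapoints.Mask(torch.randint(0, 3, (32, 32), dtype=torch.uint8))
resized = mask.resize([16, 16])              # nearest-neighbour: no blended class indices
print(type(resized), resized.spatial_size)   # still a Mask, (16, 16)
print(resized.unique())                      # only values that already existed in `mask`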
torchvision/datapoints/_video.py
ADDED
@@ -0,0 +1,250 @@
from __future__ import annotations

from typing import Any, List, Optional, Tuple, Union

import torch
from torchvision.transforms.functional import InterpolationMode

from ._datapoint import _FillTypeJIT, Datapoint


class Video(Datapoint):
    """[BETA] :class:`torch.Tensor` subclass for videos.

    Args:
        data (tensor-like): Any data that can be turned into a tensor with :func:`torch.as_tensor`.
        dtype (torch.dtype, optional): Desired data type of the video. If omitted, will be inferred from
            ``data``.
        device (torch.device, optional): Desired device of the video. If omitted and ``data`` is a
            :class:`torch.Tensor`, the device is taken from it. Otherwise, the video is constructed on the CPU.
        requires_grad (bool, optional): Whether autograd should record operations on the video. If omitted and
            ``data`` is a :class:`torch.Tensor`, the value is taken from it. Otherwise, defaults to ``False``.
    """

    @classmethod
    def _wrap(cls, tensor: torch.Tensor) -> Video:
        video = tensor.as_subclass(cls)
        return video

    def __new__(
        cls,
        data: Any,
        *,
        dtype: Optional[torch.dtype] = None,
        device: Optional[Union[torch.device, str, int]] = None,
        requires_grad: Optional[bool] = None,
    ) -> Video:
        tensor = cls._to_tensor(data, dtype=dtype, device=device, requires_grad=requires_grad)
        # validate the converted tensor so list-like `data` is also checked
        if tensor.ndim < 4:
            raise ValueError
        return cls._wrap(tensor)

    @classmethod
    def wrap_like(cls, other: Video, tensor: torch.Tensor) -> Video:
        return cls._wrap(tensor)

    def __repr__(self, *, tensor_contents: Any = None) -> str:  # type: ignore[override]
        return self._make_repr()

    @property
    def spatial_size(self) -> Tuple[int, int]:
        return tuple(self.shape[-2:])  # type: ignore[return-value]

    @property
    def num_channels(self) -> int:
        return self.shape[-3]

    @property
    def num_frames(self) -> int:
        return self.shape[-4]

    def horizontal_flip(self) -> Video:
        output = self._F.horizontal_flip_video(self.as_subclass(torch.Tensor))
        return Video.wrap_like(self, output)

    def vertical_flip(self) -> Video:
        output = self._F.vertical_flip_video(self.as_subclass(torch.Tensor))
        return Video.wrap_like(self, output)

    def resize(  # type: ignore[override]
        self,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        max_size: Optional[int] = None,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Video:
        output = self._F.resize_video(
            self.as_subclass(torch.Tensor),
            size,
            interpolation=interpolation,
            max_size=max_size,
            antialias=antialias,
        )
        return Video.wrap_like(self, output)

    def crop(self, top: int, left: int, height: int, width: int) -> Video:
        output = self._F.crop_video(self.as_subclass(torch.Tensor), top, left, height, width)
        return Video.wrap_like(self, output)

    def center_crop(self, output_size: List[int]) -> Video:
        output = self._F.center_crop_video(self.as_subclass(torch.Tensor), output_size=output_size)
        return Video.wrap_like(self, output)

    def resized_crop(
        self,
        top: int,
        left: int,
        height: int,
        width: int,
        size: List[int],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        antialias: Optional[Union[str, bool]] = "warn",
    ) -> Video:
        output = self._F.resized_crop_video(
            self.as_subclass(torch.Tensor),
            top,
            left,
            height,
            width,
            size=list(size),
            interpolation=interpolation,
            antialias=antialias,
        )
        return Video.wrap_like(self, output)

    def pad(
        self,
        padding: List[int],
        fill: Optional[Union[int, float, List[float]]] = None,
        padding_mode: str = "constant",
    ) -> Video:
        output = self._F.pad_video(self.as_subclass(torch.Tensor), padding, fill=fill, padding_mode=padding_mode)
        return Video.wrap_like(self, output)

    def rotate(
        self,
        angle: float,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        expand: bool = False,
        center: Optional[List[float]] = None,
        fill: _FillTypeJIT = None,
    ) -> Video:
        output = self._F.rotate_video(
            self.as_subclass(torch.Tensor), angle, interpolation=interpolation, expand=expand, fill=fill, center=center
        )
        return Video.wrap_like(self, output)

    def affine(
        self,
        angle: Union[int, float],
        translate: List[float],
        scale: float,
        shear: List[float],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.NEAREST,
        fill: _FillTypeJIT = None,
        center: Optional[List[float]] = None,
    ) -> Video:
        output = self._F.affine_video(
            self.as_subclass(torch.Tensor),
            angle,
            translate=translate,
            scale=scale,
            shear=shear,
            interpolation=interpolation,
            fill=fill,
            center=center,
        )
        return Video.wrap_like(self, output)

    def perspective(
        self,
        startpoints: Optional[List[List[int]]],
        endpoints: Optional[List[List[int]]],
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
        coefficients: Optional[List[float]] = None,
    ) -> Video:
        output = self._F.perspective_video(
            self.as_subclass(torch.Tensor),
            startpoints,
            endpoints,
            interpolation=interpolation,
            fill=fill,
            coefficients=coefficients,
        )
        return Video.wrap_like(self, output)

    def elastic(
        self,
        displacement: torch.Tensor,
        interpolation: Union[InterpolationMode, int] = InterpolationMode.BILINEAR,
        fill: _FillTypeJIT = None,
    ) -> Video:
        output = self._F.elastic_video(
            self.as_subclass(torch.Tensor), displacement, interpolation=interpolation, fill=fill
        )
        return Video.wrap_like(self, output)

    def rgb_to_grayscale(self, num_output_channels: int = 1) -> Video:
        output = self._F.rgb_to_grayscale_image_tensor(
            self.as_subclass(torch.Tensor), num_output_channels=num_output_channels
        )
        return Video.wrap_like(self, output)

    def adjust_brightness(self, brightness_factor: float) -> Video:
        output = self._F.adjust_brightness_video(self.as_subclass(torch.Tensor), brightness_factor=brightness_factor)
        return Video.wrap_like(self, output)

    def adjust_saturation(self, saturation_factor: float) -> Video:
        output = self._F.adjust_saturation_video(self.as_subclass(torch.Tensor), saturation_factor=saturation_factor)
        return Video.wrap_like(self, output)

    def adjust_contrast(self, contrast_factor: float) -> Video:
        output = self._F.adjust_contrast_video(self.as_subclass(torch.Tensor), contrast_factor=contrast_factor)
        return Video.wrap_like(self, output)

    def adjust_sharpness(self, sharpness_factor: float) -> Video:
        output = self._F.adjust_sharpness_video(self.as_subclass(torch.Tensor), sharpness_factor=sharpness_factor)
        return Video.wrap_like(self, output)

    def adjust_hue(self, hue_factor: float) -> Video:
        output = self._F.adjust_hue_video(self.as_subclass(torch.Tensor), hue_factor=hue_factor)
        return Video.wrap_like(self, output)

    def adjust_gamma(self, gamma: float, gain: float = 1) -> Video:
        output = self._F.adjust_gamma_video(self.as_subclass(torch.Tensor), gamma=gamma, gain=gain)
        return Video.wrap_like(self, output)

    def posterize(self, bits: int) -> Video:
        output = self._F.posterize_video(self.as_subclass(torch.Tensor), bits=bits)
        return Video.wrap_like(self, output)

    def solarize(self, threshold: float) -> Video:
        output = self._F.solarize_video(self.as_subclass(torch.Tensor), threshold=threshold)
        return Video.wrap_like(self, output)

    def autocontrast(self) -> Video:
        output = self._F.autocontrast_video(self.as_subclass(torch.Tensor))
        return Video.wrap_like(self, output)

    def equalize(self) -> Video:
        output = self._F.equalize_video(self.as_subclass(torch.Tensor))
        return Video.wrap_like(self, output)

    def invert(self) -> Video:
        output = self._F.invert_video(self.as_subclass(torch.Tensor))
        return Video.wrap_like(self, output)

    def gaussian_blur(self, kernel_size: List[int], sigma: Optional[List[float]] = None) -> Video:
        output = self._F.gaussian_blur_video(self.as_subclass(torch.Tensor), kernel_size=kernel_size, sigma=sigma)
        return Video.wrap_like(self, output)

    def normalize(self, mean: List[float], std: List[float], inplace: bool = False) -> Video:
        output = self._F.normalize_video(self.as_subclass(torch.Tensor), mean=mean, std=std, inplace=inplace)
        return Video.wrap_like(self, output)


_VideoType = Union[torch.Tensor, Video]
_VideoTypeJIT = torch.Tensor
_TensorVideoType = Union[torch.Tensor, Video]
_TensorVideoTypeJIT = torch.Tensor
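A hedged usage sketch of the class above (the random clip is illustrative only): a Video datapoint is any tensor with at least a (T, C, H, W) layout, and the transform methods return Video instances.

# Sketch: constructing a datapoints.Video and reading its shape-derived properties.
import torch
from torchvision import datapoints

clip = datapoints.Video(torch.rand(8, 3, 112, 112))            # T=8 frames, 3 channels
print(clip.num_frames, clip.num_channels, clip.spatial_size)   # 8 3 (112, 112)

out = clip.resize([56, 56])
print(type(out), tuple(out.shape))                             # still a Video, (8, 3, 56, 56)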
torchvision/datasets/__init__.py
ADDED
@@ -0,0 +1,145 @@
from ._optical_flow import FlyingChairs, FlyingThings3D, HD1K, KittiFlow, Sintel
from ._stereo_matching import (
    CarlaStereo,
    CREStereo,
    ETH3DStereo,
    FallingThingsStereo,
    InStereo2k,
    Kitti2012Stereo,
    Kitti2015Stereo,
    Middlebury2014Stereo,
    SceneFlowStereo,
    SintelStereo,
)
from .caltech import Caltech101, Caltech256
from .celeba import CelebA
from .cifar import CIFAR10, CIFAR100
from .cityscapes import Cityscapes
from .clevr import CLEVRClassification
from .coco import CocoCaptions, CocoDetection
from .country211 import Country211
from .dtd import DTD
from .eurosat import EuroSAT
from .fakedata import FakeData
from .fer2013 import FER2013
from .fgvc_aircraft import FGVCAircraft
from .flickr import Flickr30k, Flickr8k
from .flowers102 import Flowers102
from .folder import DatasetFolder, ImageFolder
from .food101 import Food101
from .gtsrb import GTSRB
from .hmdb51 import HMDB51
from .imagenet import ImageNet
from .inaturalist import INaturalist
from .kinetics import Kinetics
from .kitti import Kitti
from .lfw import LFWPairs, LFWPeople
from .lsun import LSUN, LSUNClass
from .mnist import EMNIST, FashionMNIST, KMNIST, MNIST, QMNIST
from .moving_mnist import MovingMNIST
from .omniglot import Omniglot
from .oxford_iiit_pet import OxfordIIITPet
from .pcam import PCAM
from .phototour import PhotoTour
from .places365 import Places365
from .rendered_sst2 import RenderedSST2
from .sbd import SBDataset
from .sbu import SBU
from .semeion import SEMEION
from .stanford_cars import StanfordCars
from .stl10 import STL10
from .sun397 import SUN397
from .svhn import SVHN
from .ucf101 import UCF101
from .usps import USPS
from .vision import VisionDataset
from .voc import VOCDetection, VOCSegmentation
from .widerface import WIDERFace

__all__ = (
    "LSUN",
    "LSUNClass",
    "ImageFolder",
    "DatasetFolder",
    "FakeData",
    "CocoCaptions",
    "CocoDetection",
    "CIFAR10",
    "CIFAR100",
    "EMNIST",
    "FashionMNIST",
    "QMNIST",
    "MNIST",
    "KMNIST",
    "StanfordCars",
    "STL10",
    "SUN397",
    "SVHN",
    "PhotoTour",
    "SEMEION",
    "Omniglot",
    "SBU",
    "Flickr8k",
    "Flickr30k",
    "Flowers102",
    "VOCSegmentation",
    "VOCDetection",
    "Cityscapes",
    "ImageNet",
    "Caltech101",
    "Caltech256",
    "CelebA",
    "WIDERFace",
    "SBDataset",
    "VisionDataset",
    "USPS",
    "Kinetics",
    "HMDB51",
    "UCF101",
    "Places365",
    "Kitti",
    "INaturalist",
    "LFWPeople",
    "LFWPairs",
    "KittiFlow",
    "Sintel",
    "FlyingChairs",
    "FlyingThings3D",
    "HD1K",
    "Food101",
    "DTD",
    "FER2013",
    "GTSRB",
    "CLEVRClassification",
    "OxfordIIITPet",
    "PCAM",
    "Country211",
    "FGVCAircraft",
    "EuroSAT",
    "RenderedSST2",
    "Kitti2012Stereo",
    "Kitti2015Stereo",
    "CarlaStereo",
    "Middlebury2014Stereo",
    "CREStereo",
    "FallingThingsStereo",
    "SceneFlowStereo",
    "SintelStereo",
    "InStereo2k",
    "ETH3DStereo",
)


# We override current module's attributes to handle the import:
# from torchvision.datasets import wrap_dataset_for_transforms_v2
# with beta state v2 warning from torchvision.datapoints
# We also want to avoid raising the warning when importing other attributes
# from torchvision.datasets
# Ref: https://peps.python.org/pep-0562/
def __getattr__(name):
    if name in ("wrap_dataset_for_transforms_v2",):
        from torchvision.datapoints._dataset_wrapper import wrap_dataset_for_transforms_v2

        return wrap_dataset_for_transforms_v2

    raise AttributeError(f"module {__name__!r} has no attribute {name!r}")
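A small hedged sketch of what the module-level __getattr__ above buys (PEP 562 lazy attribute access; the nonexistent name below is made up): importing torchvision.datasets alone does not touch torchvision.datapoints, and the beta-state warning only fires once wrap_dataset_for_transforms_v2 is actually requested.

# Sketch: lazy attribute access through the __getattr__ defined above.
import torchvision.datasets as datasets

fn = datasets.wrap_dataset_for_transforms_v2   # triggers the lazy import (and its warning)
try:
    datasets.does_not_exist                    # any other missing name ...
except AttributeError as exc:
    print(exc)                                 # ... raises AttributeError as usual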
torchvision/datasets/__pycache__/__init__.cpython-38.pyc
ADDED
Binary file (3.28 kB)

torchvision/datasets/__pycache__/_optical_flow.cpython-38.pyc
ADDED
Binary file (17.6 kB)

torchvision/datasets/__pycache__/_stereo_matching.cpython-38.pyc
ADDED
Binary file (40.2 kB)

torchvision/datasets/__pycache__/caltech.cpython-38.pyc
ADDED
Binary file (8.1 kB)

torchvision/datasets/__pycache__/celeba.cpython-38.pyc
ADDED
Binary file (7.14 kB)

torchvision/datasets/__pycache__/cifar.cpython-38.pyc
ADDED
Binary file (5.81 kB)

torchvision/datasets/__pycache__/cityscapes.cpython-38.pyc
ADDED
Binary file (8.41 kB)

torchvision/datasets/__pycache__/clevr.cpython-38.pyc
ADDED
Binary file (4.11 kB)

torchvision/datasets/__pycache__/coco.cpython-38.pyc
ADDED
Binary file (5.02 kB)

torchvision/datasets/__pycache__/country211.cpython-38.pyc
ADDED
Binary file (2.79 kB)

torchvision/datasets/__pycache__/dtd.cpython-38.pyc
ADDED
Binary file (4.33 kB)

torchvision/datasets/__pycache__/eurosat.cpython-38.pyc
ADDED
Binary file (2.46 kB)

torchvision/datasets/__pycache__/fakedata.cpython-38.pyc
ADDED
Binary file (2.67 kB)

torchvision/datasets/__pycache__/fer2013.cpython-38.pyc
ADDED
Binary file (3.3 kB)

torchvision/datasets/__pycache__/fgvc_aircraft.cpython-38.pyc
ADDED
Binary file (4.72 kB)

torchvision/datasets/__pycache__/flickr.cpython-38.pyc
ADDED
Binary file (5.27 kB)

torchvision/datasets/__pycache__/flowers102.cpython-38.pyc
ADDED
Binary file (4.6 kB)

torchvision/datasets/__pycache__/folder.cpython-38.pyc
ADDED
Binary file (11.5 kB)

torchvision/datasets/__pycache__/food101.cpython-38.pyc
ADDED
Binary file (4.35 kB)

torchvision/datasets/__pycache__/gtsrb.cpython-38.pyc
ADDED
Binary file (3.74 kB)

torchvision/datasets/__pycache__/hmdb51.cpython-38.pyc
ADDED
Binary file (5.64 kB)

torchvision/datasets/__pycache__/imagenet.cpython-38.pyc
ADDED
Binary file (9.69 kB)

torchvision/datasets/__pycache__/inaturalist.cpython-38.pyc
ADDED
Binary file (8.59 kB)

torchvision/datasets/__pycache__/kinetics.cpython-38.pyc
ADDED
Binary file (9.66 kB)