Source code for datasets.filesystems

import importlib

import fsspec


_has_s3fs = importlib.util.find_spec("s3fs") is not None

if _has_s3fs:
    from .s3filesystem import S3FileSystem  # noqa: F401


[docs]def extract_path_from_uri(dataset_path: str) -> str: """ preprocesses `dataset_path` and removes remote filesystem (e.g. removing ``s3://``) Args: dataset_path (``str``): path (e.g. ``dataset/train``) or remote uri (e.g. ``s3://my-bucket/dataset/train``) of the dataset directory """ if "://" in dataset_path: dataset_path = dataset_path.split("://")[1] return dataset_path
[docs]def is_remote_filesystem(fs: fsspec.spec.AbstractFileSystem) -> bool: """ Validates if filesystem has remote protocol. Args: fs (``fsspec.spec.AbstractFileSystem``): An abstract super-class for pythonic file-systems, e.g. :code:`fsspec.filesystem(\'file\')` or :class:`datasets.filesystem.S3FileSystem` """ if fs is not None and fs.protocol != "file": return True else: return False