from itertools import islice

from datasets import load_dataset
from PIL import Image
# Dataset selection: the loading script handed to `load_dataset` and the
# configuration name it is asked to build.
dataset_name = "image_caption_dataset.py"
dataset_config_name = "coco_2017"

# Options forwarded unchanged to `load_dataset`.
cache_dir = None  # NOTE(review): presumably lets the library pick its default cache -- confirm
keep_in_memory = False
data_dir = "./"  # NOTE(review): presumably where the loading script looks for the raw data -- confirm

# Load every split of the configured dataset; the loops below read the
# "train" and "validation" splits from this object.
dataset = load_dataset(
    dataset_name,
    dataset_config_name,
    cache_dir=cache_dir,
    keep_in_memory=keep_in_memory,
    data_dir=data_dir,
)
# Sanity check: print only the first example of the "train" split.
# A loop with an immediate `break` (rather than `next(iter(...))`) keeps this
# a silent no-op when the split is empty.
for example in dataset["train"]:
    print(example)
    # Optional: uncomment to also open the example's image with PIL.
    # with Image.open(example['image_file']) as image:
    #     image.show()
    break
# Preview the first five examples of the "validation" split: print each record
# and display the image referenced by its 'image_file' entry.
# `islice` stops after five items without an explicit counter.
for example in islice(dataset["validation"], 5):
    print(example)
    # The context manager closes the image file once it has been shown.
    with Image.open(example['image_file']) as image:
        image.show()