File size: 648 Bytes
8ffa189
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
from datasets import load_dataset
from PIL import Image


# Arguments handed to `load_dataset` below; every value is forwarded unchanged.
data_dir = "./"  # forwarded as `data_dir`
keep_in_memory = False  # forwarded as `keep_in_memory`
cache_dir = None  # forwarded as `cache_dir`
dataset_config_name = "coco_2017"  # second positional argument
# First positional argument. NOTE(review): presumably a dataset loading
# script located next to this file -- confirm.
dataset_name = "image_caption_dataset.py"

# The result is indexed by split name ("train", "validation") further down.
dataset = load_dataset(
    dataset_name,
    dataset_config_name,
    data_dir=data_dir,
    cache_dir=cache_dir,
    keep_in_memory=keep_in_memory,
)

# Sanity check: print only the first example of the "train" split.
# The image is not displayed here; to view it as well, open
# example['image_file'] with PIL's Image.open and call .show() on the result.
try:
    example = next(iter(dataset["train"]))
except StopIteration:
    # Empty split: there is nothing to print.
    pass
else:
    print(example)

# Preview the first five examples of the "validation" split: print each one,
# then open the file referenced by its "image_file" entry and display it.
for _idx, example in enumerate(dataset["validation"]):
    if _idx < 5:
        print(example)
        image_path = example["image_file"]
        # The context manager closes the image file once it has been shown.
        with Image.open(image_path) as image:
            image.show()
    else:
        # Five examples have been handled; stop iterating.
        break