# vit-gpt2 / test_coco_dataset_script.py
# ydshieh
# update model.py and add coco files
# a99072f
# raw history blame
# No virus
# 451 Bytes
import csv
import json
import os
import datasets
import pandas as pd
import numpy as np
# Build the dataset through the local COCO loading script and keep only the
# 'train' split for the checks below.
ds = datasets.load_dataset(
    './coco_dataset_script.py',
    data_dir='/home/33611/caption/',
)['train']
def transform(example):
    """Attach the array stored in the example's pixels file.

    Loads the file named by ``example['pixels_file']`` with ``np.load`` and
    stores the result under ``example['pixel_values']``.

    Args:
        example: Mapping with a ``'pixels_file'`` entry that ``np.load`` can
            read.

    Returns:
        The same ``example`` object, modified in place.
    """
    example['pixel_values'] = np.load(example['pixels_file'])
    return example
# Disabled: uncomment to add 'pixel_values' to every example via transform().
# ds = ds.map(transform)
# Smoke-check up to the first ten examples of `ds`: each one must reference an
# image file that exists on disk. The tenth example is printed for manual
# inspection and the loop stops there; with fewer than ten examples nothing
# is printed.
n = 0  # keeps `n` defined (as 0) when `ds` yields no examples
for n, x in enumerate(ds, start=1):
    assert os.path.isfile(x['image_file']), f"missing image file: {x['image_file']!r}"
    if n == 10:
        print(x)
        break