File size: 812 Bytes
14e4843 d6d7ec6 14e4843 d6d7ec6 14e4843 d6d7ec6 14e4843 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 |
#!/usr/bin/env python3
import json
from datasets import Dataset, DatasetDict
# Path of the local JSON file whose records are uploaded.
file_path = "shroom-data/val.model-agnostic.json"
# Hub repository id that the resulting DatasetDict is pushed to.
ds_path = "pminervini/shroom"

# Decode explicitly as UTF-8: without `encoding`, open() falls back to the
# platform locale, which can fail or mis-decode non-ASCII text.
with open(file_path, "r", encoding="utf-8") as file:
    # The rest of the script iterates `data` as a sequence of dicts that
    # each carry a "task" key.
    data = json.load(file)
def convert(list_of_dicts):
    """Transpose a list of record dicts into a dict of column lists.

    Every returned column has exactly one entry per input record, in input
    order. A record that lacks a key contributes ``None`` to that column, so
    values from different records can never shift onto the wrong row.

    Args:
        list_of_dicts: Iterable of mappings, one per record.

    Returns:
        A dict mapping each key seen in any record to its list of values.
        Keys appear in first-seen order; an empty input yields ``{}``.
    """
    dict_of_lists = {}
    for row_index, record in enumerate(list_of_dicts):
        for key, value in record.items():
            column = dict_of_lists.get(key)
            if column is None:
                # First time this key shows up: back-fill the earlier rows.
                column = dict_of_lists[key] = [None] * row_index
            column.append(value)
        # Pad columns this record did not provide, keeping rows aligned.
        for column in dict_of_lists.values():
            if len(column) <= row_index:
                column.append(None)
    return dict_of_lists
# Bucket the records by their "task" value. The "task" field is removed from
# each record because it becomes the key of the DatasetDict instead.
task_to_data_map = {}
for entry in data:
    task_name = entry.pop("task")
    task_to_data_map.setdefault(task_name, []).append(entry)

# Build one column-oriented Dataset per task.
task_to_ds_map = {
    name: Dataset.from_dict(convert(records))
    for name, records in task_to_data_map.items()
}

# Bundle the per-task datasets and upload them to the Hub repository.
ds_dict = DatasetDict(task_to_ds_map)
ds_dict.push_to_hub(ds_path)
|