Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
#!/usr/bin/env python3 | |
import json | |
from datasets import Dataset, DatasetDict | |
file_path = "shroom-data/val.model-agnostic.json" | |
ds_path = 'pminervini/shroom' | |
with open(file_path, 'r') as file: | |
data = json.load(file) | |
def convert(list_of_dicts): | |
dict_of_lists = {} | |
for d in list_of_dicts: | |
for key, value in d.items(): | |
dict_of_lists.setdefault(key, []).append(value) | |
return dict_of_lists | |
task_to_data_map = {} | |
for entry in data: | |
task_name = entry["task"] | |
del entry["task"] | |
if task_name not in task_to_data_map: | |
task_to_data_map[task_name] = [] | |
task_to_data_map[task_name] += [entry] | |
task_to_ds_map = {k: Dataset.from_dict(convert(data)) for k, data in task_to_data_map.items()} | |
ds_dict = DatasetDict(task_to_ds_map) | |
ds_dict.push_to_hub(ds_path) | |