Spaces:
Runtime error
Runtime error
import argparse | |
from datasets import load_dataset, concatenate_datasets | |
def main(args):
    """Merge several datasets into one shuffled dataset and save it to disk.

    For each path in ``args.dataset`` the ``train`` split is loaded from the
    ``*.arrow`` files found there; the loaded datasets are concatenated,
    shuffled, and written to ``args.output_folder``.

    Args:
        args: Namespace-like object exposing ``dataset`` (a non-empty list of
            dataset paths) and ``output_folder`` (destination directory).

    Raises:
        ValueError: If no dataset path or no output folder was supplied.
    """
    # Validate up front so a missing argument fails immediately with a clear
    # message instead of an opaque error after all datasets have been loaded.
    if not args.dataset:
        raise ValueError("at least one dataset path is required (-d/--dataset)")
    if not args.output_folder:
        raise ValueError("an output folder is required (-o/--output_folder)")

    dss = [
        load_dataset(dataset_path, split="train", data_files="*.arrow")
        for dataset_path in args.dataset
    ]
    ds = concatenate_datasets(dss)
    # NOTE: no seed is passed to shuffle(), matching the original behaviour.
    ds = ds.shuffle()
    ds.save_to_disk(args.output_folder)
if __name__ == "__main__":
    # Command-line entry point: collect one or more dataset paths and an
    # output folder, then hand them to main().
    parser = argparse.ArgumentParser(
        description="Concatenate and shuffle datasets, then save the result to disk."
    )
    # Both options are required so a missing argument yields an argparse usage
    # error rather than a traceback from inside main().
    parser.add_argument(
        "-d",
        "--dataset",
        type=str,
        action="append",
        required=True,
        help="Path of a dataset to include; repeat the flag to merge several.",
    )
    parser.add_argument(
        "-o",
        "--output_folder",
        type=str,
        required=True,
        help="Folder where the merged, shuffled dataset is saved.",
    )
    args = parser.parse_args()
    main(args)