| from datasets import load_dataset | |
| from config import DATASET_EN_ES | |
def load_and_prepare():
    """Load the dataset named by ``DATASET_EN_ES`` and add source/target fields.

    Each example is passed through a helper that reads the ``"en"`` and
    ``"es"`` entries of the example's ``"term"`` field and returns them under
    the keys ``"source"`` and ``"target"`` respectively.

    Returns:
        The object produced by calling ``.map`` on the loaded dataset with
        that helper.
    """

    def _to_pair(record):
        # Both languages live under the same nested "term" entry.
        terms = record["term"]
        return {"source": terms["en"], "target": terms["es"]}

    raw = load_dataset(DATASET_EN_ES)
    return raw.map(_to_pair)
if __name__ == "__main__":
    # Quick manual check: print the first example of the "train" entry.
    prepared = load_and_prepare()
    train_split = prepared["train"]
    print(train_split[0])