from datasets import load_dataset | |
# Download the OpenAssistant dataset | |
dataset = load_dataset("OpenAssistant/oasst1", split="train") | |
# Keep only French conversations | |
dataset = dataset.filter(lambda x: x["lang"] == "fr") | |
# Print an example to check if it's correct | |
print("Example conversation from dataset:") | |
print(dataset[0]) | |