File size: 329 Bytes
from datasets import load_dataset
# Fetch the "train" split of OpenAssistant/oasst1 through `load_dataset`,
# keep only the rows whose "lang" field equals "fr", then print the first
# remaining row as a quick sanity check.


def _is_french(row):
    """Return True when the row's "lang" field is exactly "fr"."""
    return row["lang"] == "fr"


dataset = (
    load_dataset("OpenAssistant/oasst1", split="train")
    .filter(_is_french)
)

# Show a single record so the filter result can be checked by eye.
# NOTE(review): the label below says "conversation", but oasst1 rows appear
# to be individual messages rather than whole conversations — confirm against
# the dataset card.
# NOTE(review): indexing [0] presumably fails if the filter matched nothing —
# confirm whether that case needs handling.
print("Example conversation from dataset:")
print(dataset[0])
|