from datasets import load_dataset

# Load the local JSON file and show the loaded object plus the first record
# of its "train" split as a quick sanity check.
dataset = load_dataset("json", data_files="dataset.json")
print(dataset)
print(dataset["train"][0])


def to_chat_format(example):
    """Convert one dataset record into a single-field chat-style sample.

    Args:
        example: A record (mapping) with a "preguntas" entry that supports
            indexing; only its first element is used.

    Returns:
        A dict with one key, "text", holding ``"User: <first question>"``.

    Raises:
        KeyError: If ``example`` has no "preguntas" entry.
        IndexError: If "preguntas" is empty.
    """
    # NOTE(review): the original source was cut off right after the user
    # turn, so only that part is reproduced here. If the sample was meant to
    # carry more (e.g. a reply turn), append it to the f-string below.
    first_question = example["preguntas"][0]
    # The placeholder must sit inside the f-string; the original closed the
    # quote after "User", leaving the colon and braces outside the literal.
    return {"text": f"User: {first_question}"}