File size: 427 Bytes
d9cc673
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
from datasets import load_dataset
from config import DATASET_EN_ES

def load_and_prepare():
    """Load the dataset identified by ``DATASET_EN_ES`` and derive text pairs.

    Each record is passed through a mapper that produces two fields:
    ``"source"`` (taken from ``record["term"]["en"]``) and ``"target"``
    (taken from ``record["term"]["es"]``).

    Returns:
        Whatever ``load_dataset(...).map(...)`` returns for the loaded
        object. The script entry point indexes it by ``"train"``, so it is
        presumably keyed by split name — confirm against the dataset.
    """

    def _to_pair(record):
        # NOTE(review): assumes every record carries a "term" mapping with
        # both "en" and "es" keys — verify against the dataset schema.
        term = record["term"]
        return {"source": term["en"], "target": term["es"]}

    raw = load_dataset(DATASET_EN_ES)
    return raw.map(_to_pair)

if __name__ == "__main__":
    # Manual smoke run: prepare the dataset and show the first "train" record.
    prepared = load_and_prepare()
    first_train_row = prepared["train"][0]
    print(first_train_row)