File size: 319 Bytes
bde1c71
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
# src/evaluators/transliteration/datasets.py
# Registry of datasets available for transliteration evaluation, keyed by a
# short dataset id. Each entry names where the data lives ("path"), which
# split to read ("split"), the input and reference columns ("source_col" /
# "target_col"), and a human-readable label ("description").
# NOTE(review): "path" looks like a Hugging Face Hub repo id — confirm
# against the code that consumes this registry.
TRANSLITERATION_DATASETS = {
    "madar-tun": dict(
        path="tunis-ai/MADAR-TUN",
        split="test",
        source_col="arabish",  # column holding the Latin-script text
        target_col="words",  # column holding the Arabic-script text
        description="MADAR-TUN: Arabizi ↔ Arabic script",
    ),
}