NedoTurkishTokenizer / tokenizer_config.json
nmstech's picture
Rename project from TurkTokenizer to NedoTurkishTokenizer
cfffd93
{
  "tokenizer_class": "NedoTurkishTokenizer",
  "model_type": "nedo-turkish-tokenizer",
  "auto_map": {
    "AutoTokenizer": ["tokenization_nedo_turkish.NedoTurkishTokenizer", null]
  },
  "version": "1.0.0",
  "language": "tr",
  "description": "Turkish morphological tokenizer — 92% on TR-MMLU (reported world record)",
  "requires_java": true,
  "dependencies": ["turkish-tokenizer", "jpype1"]
}