Urdu-Tokenizer / tokenizer_config.json
zuhri025's picture
Upload tokenizer
8fa2160 verified
raw
history blame contribute delete
672 Bytes
{
"backend": "tokenizers",
"bos_token": "<|bos|>",
"eos_token": "<|eos|>",
"extra_special_tokens": [
"<|pad|>",
"<|unk|>",
"<|bos|>",
"<|eos|>",
"<|start_of_speech|>",
"<|end_of_speech|>",
"<|start_of_text|>",
"<|end_of_text|>",
"<|speech|>",
"<|sep|>",
"<|alloy|>",
"<|amuch|>",
"<|ash|>",
"<|ballad|>",
"<|coral|>",
"<|dan|>",
"<|echo|>",
"<|fable|>",
"<|nova|>",
"<|onyx|>",
"<|sage|>",
"<|shimmer|>",
"<|verse|>"
],
"model_max_length": 1000000000000000019884624838656,
"pad_token": "<|pad|>",
"tokenizer_class": "TokenizersBackend",
"unk_token": "<|unk|>"
}