Hypa-Whisper-small-2026-03-26-Randy / tokenizer_config.json
hypaai's picture
Training in progress, step 50
96b4731 verified
raw
history blame contribute delete
611 Bytes
{
  "add_prefix_space": false,
  "backend": "tokenizers",
  "bos_token": "<|endoftext|>",
  "clean_up_tokenization_spaces": true,
  "eos_token": "<|endoftext|>",
  "errors": "replace",
  "extra_special_tokens": [
    "<|ig|>",
    "<|iga|>",
    "<|an|>",
    "<|tiv|>"
  ],
  "is_local": false,
  "language": "english",
  "model_max_length": 1024,
  "pad_token": "<|endoftext|>",
  "padding_side": "left",
  "predict_timestamps": false,
  "processor_class": "WhisperProcessor",
  "return_attention_mask": false,
  "task": "transcribe",
  "tokenizer_class": "WhisperTokenizer",
  "unk_token": "<|endoftext|>"
}