base_IIXIV / tokenizer_config.json
mainline777's picture
Duplicate from silx-ai/Quasar-Preview
41865df
Raw
History Blame Contribute Delete
488 Bytes
{
  "backend": "tokenizers",
  "bos_token": "<|startoftext|>",
  "clean_up_tokenization_spaces": false,
  "cls_token": "[CLS]",
  "eos_token": "<|endoftext|>",
  "fast_tokenizer": true,
  "gmask_token": "[gMASK]",
  "is_local": false,
  "local_files_only": false,
  "merges_file": null,
  "model_max_length": 1000000000000000019884624838656,
  "model_specific_special_tokens": {
    "gmask_token": "[gMASK]"
  },
  "pad_token": "<|endoftext|>",
  "tokenizer_class": "TokenizersBackend"
}