LightOnOCR-4bit / tokenizer_config.json
humpf's picture
Upload folder using huggingface_hub
1835135 verified
{
"add_prefix_space": false,
"backend": "tokenizers",
"bos_token": null,
"clean_up_tokenization_spaces": false,
"eos_token": "<|im_end|>",
"errors": "replace",
"image_break_token": "<|vision_pad|>",
"image_end_token": "<|vision_end|>",
"image_token": "<|image_pad|>",
"is_local": true,
"local_files_only": false,
"max_length": null,
"model_max_length": 131072,
"model_specific_special_tokens": {
"image_break_token": "<|vision_pad|>",
"image_end_token": "<|vision_end|>",
"image_token": "<|image_pad|>"
},
"pad_to_multiple_of": null,
"pad_token": "<|endoftext|>",
"pad_token_type_id": 0,
"padding_side": "right",
"processor_class": "Mistral3Processor",
"split_special_tokens": false,
"tokenizer_class": "TokenizersBackend",
"unk_token": null
}