bitmar-attention-multimodal / tokenizer_config.json
estebancarlin's picture
Initial upload: BitMar Epoch 1 - 99,686,013 tokens processed
60b91bb verified
raw
history blame
399 Bytes
{
  "tokenizer_class": "GPT2Tokenizer",
  "bos_token": "<|endoftext|>",
  "eos_token": "<|endoftext|>",
  "pad_token": "<|endoftext|>",
  "unk_token": "<|endoftext|>",
  "add_prefix_space": false,
  "model_max_length": 1024,
  "special_tokens_map_file": null,
  "name_or_path": "gpt2",
  "tokenizer_type": "GPT2Tokenizer"
}