llama3_baseline / tokenizer_config.json
smithblack-0's picture
Update architecture and tokenizer
e6fbdc8 verified
raw
history blame contribute delete
352 Bytes
{
"add_prefix_space": false,
"backend": "tokenizers",
"bos_token": "<|endoftext|>",
"eos_token": "<|endoftext|>",
"errors": "replace",
"is_local": false,
"model_max_length": 1000000000000000019884624838656,
"pad_token": "<|padding|>",
"tokenizer_class": "GPTNeoXTokenizerFast",
"trim_offsets": true,
"unk_token": "<|endoftext|>"
}