{
  "tokenizer_class": "PreTrainedTokenizerFast",
  "model_max_length": 512,
  "bos_token": "<|startoftext|>",
  "eos_token": "<|endoftext|>",
  "pad_token": "<|pad|>",
  "unk_token": "<|unk|>",
  "clean_up_tokenization_spaces": true
}