{ "clean_up_tokenization_spaces": true, "model_max_length": 512, "special_tokens": [ "[PAD]", "[SEP]", "[CLS]", "[UNK]" ], "tokenizer_class": "PreTrainedTokenizerFast" }