{ "version": "1.0", "truncation": { "max_length": 65536, "strategy": "longest_first", "direction": "right" }, "padding": { "strategy": "right", "pad_id": 0, "pad_token": "" }, "added_tokens": [ {"id": 0, "content": "", "single_word": false, "special": true}, {"id": 1, "content": "", "single_word": false, "special": true}, {"id": 2, "content": "", "single_word": false, "special": true} ], "normalizer": { "type": "NFKC" }, "pre_tokenizer": { "type": "Whitespace" }, "post_processor": { "type": "TemplateProcessing", "single": " $A ", "pair": " $A $B ", "special_tokens": { "": 1, "": 2 } }, "decoder": { "type": "WordPiece", "prefix": "##" }, "model": { "type": "BPE", "vocab": { "": 0, "": 1, "": 2, "the": 3, "of": 4, "to": 5, "and": 6, "I": 7, "you": 8 }, "merges": [ "t h", "th e", "a n", "a nd", "i n", "i ng" ] } }