FireRedLID-vllm / tokenizer_config.json
PatchyTisa's picture
Add files using upload-large-folder tool
1d67dac verified
{
"tokenizer_class": "PreTrainedTokenizerFast",
"model_type": "fireredlid",
"bos_token": "<sos>",
"eos_token": "<eos>",
"unk_token": "<unk>",
"pad_token": "<pad>",
"added_tokens_decoder": {
"0": {
"content": "<blank>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
"1": {
"content": "<unk>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
"2": {
"content": "<pad>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
"3": {
"content": "<sos>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
"4": {
"content": "<eos>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
"5": {
"content": "en",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"6": {
"content": "es",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"7": {
"content": "fr",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"8": {
"content": "zh",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"9": {
"content": "other",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"10": {
"content": "xinan",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"11": {
"content": "ja",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"12": {
"content": "ko",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"13": {
"content": "ru",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"14": {
"content": "mandarin",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"15": {
"content": "min",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"16": {
"content": "wu",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"17": {
"content": "xiang",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"18": {
"content": "yue",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"19": {
"content": "north",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"20": {
"content": "de",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"21": {
"content": "pt",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"22": {
"content": "ab",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"23": {
"content": "af",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"24": {
"content": "am",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"25": {
"content": "ar",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"26": {
"content": "as",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"27": {
"content": "az",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"28": {
"content": "ba",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"29": {
"content": "be",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"30": {
"content": "bg",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"31": {
"content": "bn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"32": {
"content": "br",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"33": {
"content": "ca",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"34": {
"content": "cs",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"35": {
"content": "cy",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"36": {
"content": "da",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"37": {
"content": "el",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"38": {
"content": "eo",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"39": {
"content": "et",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"40": {
"content": "eu",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"41": {
"content": "fa",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"42": {
"content": "gl",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"43": {
"content": "gn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"44": {
"content": "ha",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"45": {
"content": "iw",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"46": {
"content": "hi",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"47": {
"content": "ht",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"48": {
"content": "hu",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"49": {
"content": "hy",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"50": {
"content": "ia",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"51": {
"content": "id",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"52": {
"content": "is",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"53": {
"content": "it",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"54": {
"content": "ka",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"55": {
"content": "kk",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"56": {
"content": "lo",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"57": {
"content": "lt",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"58": {
"content": "lv",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"59": {
"content": "mk",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"60": {
"content": "ml",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"61": {
"content": "mn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"62": {
"content": "mr",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"63": {
"content": "mt",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"64": {
"content": "no",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"65": {
"content": "ne",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"66": {
"content": "nl",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"67": {
"content": "nn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"68": {
"content": "oc",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"69": {
"content": "pa",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"70": {
"content": "pl",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"71": {
"content": "ps",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"72": {
"content": "ro",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"73": {
"content": "sd",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"74": {
"content": "sk",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"75": {
"content": "sl",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"76": {
"content": "sq",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"77": {
"content": "sr",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"78": {
"content": "sv",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"79": {
"content": "sw",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"80": {
"content": "ta",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"81": {
"content": "te",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"82": {
"content": "tg",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"83": {
"content": "th",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"84": {
"content": "tk",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"85": {
"content": "tr",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"86": {
"content": "tt",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"87": {
"content": "uk",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"88": {
"content": "ur",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"89": {
"content": "uz",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"90": {
"content": "vi",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"91": {
"content": "yi",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"92": {
"content": "yo",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"93": {
"content": "kn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"94": {
"content": "so",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"95": {
"content": "ceb",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"96": {
"content": "jw",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"97": {
"content": "mi",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"98": {
"content": "hr",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"99": {
"content": "bs",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"100": {
"content": "tl",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"101": {
"content": "ln",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"102": {
"content": "my",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"103": {
"content": "fi",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"104": {
"content": "sn",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"105": {
"content": "lb",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"106": {
"content": "gu",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"107": {
"content": "ms",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"108": {
"content": "km",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"109": {
"content": "bo",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"110": {
"content": "fo",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"111": {
"content": "gv",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"112": {
"content": "haw",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"113": {
"content": "la",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"114": {
"content": "mg",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"115": {
"content": "sa",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"116": {
"content": "sco",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"117": {
"content": "si",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"118": {
"content": "su",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
},
"119": {
"content": "war",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": false
}
}
}