Sheikh-ABF / tokenizer.json
likhonsheikh's picture
Upload merged LoRA model and tokenizer
3445b9d verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 0,
"content": "<bos>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 1,
"content": "<eos>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 2,
"content": "<pad>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 405,
"content": "<unk>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": "",
"end_of_word_suffix": "",
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"<bos>": 0,
"<eos>": 1,
"<pad>": 2,
"<think>": 3,
"</think>": 4,
"!": 5,
"\"": 6,
"#": 7,
"$": 8,
"%": 9,
"&": 10,
"'": 11,
"(": 12,
")": 13,
"*": 14,
"+": 15,
",": 16,
"-": 17,
".": 18,
"/": 19,
"0": 20,
"1": 21,
"2": 22,
"3": 23,
"4": 24,
"5": 25,
"6": 26,
"7": 27,
"8": 28,
"9": 29,
":": 30,
";": 31,
"<": 32,
"=": 33,
">": 34,
"?": 35,
"@": 36,
"A": 37,
"B": 38,
"C": 39,
"D": 40,
"E": 41,
"F": 42,
"G": 43,
"H": 44,
"I": 45,
"J": 46,
"K": 47,
"L": 48,
"M": 49,
"N": 50,
"O": 51,
"P": 52,
"Q": 53,
"R": 54,
"S": 55,
"T": 56,
"U": 57,
"V": 58,
"W": 59,
"X": 60,
"Y": 61,
"Z": 62,
"[": 63,
"\\": 64,
"]": 65,
"^": 66,
"_": 67,
"`": 68,
"a": 69,
"b": 70,
"c": 71,
"d": 72,
"e": 73,
"f": 74,
"g": 75,
"h": 76,
"i": 77,
"j": 78,
"k": 79,
"l": 80,
"m": 81,
"n": 82,
"o": 83,
"p": 84,
"q": 85,
"r": 86,
"s": 87,
"t": 88,
"u": 89,
"v": 90,
"w": 91,
"x": 92,
"y": 93,
"z": 94,
"{": 95,
"|": 96,
"}": 97,
"~": 98,
"¡": 99,
"¢": 100,
"£": 101,
"¤": 102,
"¥": 103,
"¦": 104,
"§": 105,
"¨": 106,
"©": 107,
"ª": 108,
"«": 109,
"¬": 110,
"®": 111,
"¯": 112,
"°": 113,
"±": 114,
"²": 115,
"³": 116,
"´": 117,
"µ": 118,
"¶": 119,
"·": 120,
"¸": 121,
"¹": 122,
"º": 123,
"»": 124,
"¼": 125,
"½": 126,
"¾": 127,
"¿": 128,
"À": 129,
"Á": 130,
"Â": 131,
"Ã": 132,
"Ä": 133,
"Å": 134,
"Æ": 135,
"Ç": 136,
"È": 137,
"É": 138,
"Ê": 139,
"Ë": 140,
"Ì": 141,
"Í": 142,
"Î": 143,
"Ï": 144,
"Ð": 145,
"Ñ": 146,
"Ò": 147,
"Ó": 148,
"Ô": 149,
"Õ": 150,
"Ö": 151,
"×": 152,
"Ø": 153,
"Ù": 154,
"Ú": 155,
"Û": 156,
"Ü": 157,
"Ý": 158,
"Þ": 159,
"ß": 160,
"à": 161,
"á": 162,
"â": 163,
"ã": 164,
"ä": 165,
"å": 166,
"æ": 167,
"ç": 168,
"è": 169,
"é": 170,
"ê": 171,
"ë": 172,
"ì": 173,
"í": 174,
"î": 175,
"ï": 176,
"ð": 177,
"ñ": 178,
"ò": 179,
"ó": 180,
"ô": 181,
"õ": 182,
"ö": 183,
"÷": 184,
"ø": 185,
"ù": 186,
"ú": 187,
"û": 188,
"ü": 189,
"ý": 190,
"þ": 191,
"ÿ": 192,
"Ā": 193,
"ā": 194,
"Ă": 195,
"ă": 196,
"Ą": 197,
"ą": 198,
"Ć": 199,
"ć": 200,
"Ĉ": 201,
"ĉ": 202,
"Ċ": 203,
"ċ": 204,
"Č": 205,
"č": 206,
"Ď": 207,
"ď": 208,
"Đ": 209,
"đ": 210,
"Ē": 211,
"ē": 212,
"Ĕ": 213,
"ĕ": 214,
"Ė": 215,
"ė": 216,
"Ę": 217,
"ę": 218,
"Ě": 219,
"ě": 220,
"Ĝ": 221,
"ĝ": 222,
"Ğ": 223,
"ğ": 224,
"Ġ": 225,
"ġ": 226,
"Ģ": 227,
"ģ": 228,
"Ĥ": 229,
"ĥ": 230,
"Ħ": 231,
"ħ": 232,
"Ĩ": 233,
"ĩ": 234,
"Ī": 235,
"ī": 236,
"Ĭ": 237,
"ĭ": 238,
"Į": 239,
"į": 240,
"İ": 241,
"ı": 242,
"IJ": 243,
"ij": 244,
"Ĵ": 245,
"ĵ": 246,
"Ķ": 247,
"ķ": 248,
"ĸ": 249,
"Ĺ": 250,
"ĺ": 251,
"Ļ": 252,
"ļ": 253,
"Ľ": 254,
"ľ": 255,
"Ŀ": 256,
"ŀ": 257,
"Ł": 258,
"ł": 259,
"Ń": 260,
"à¦": 261,
"à§": 262,
"Ġà¦": 263,
"া": 264,
"র": 265,
"à§ĩ": 266,
"à§į": 267,
"ি": 268,
"ন": 269,
"ত": 270,
"ল": 271,
"য": 272,
"ব": 273,
"à¦ķ": 274,
"¥¤": 275,
"।": 276,
"দ": 277,
"়": 278,
"ম": 279,
"à§ģ": 280,
"Ġস": 281,
"শ": 282,
"Ġà¦ķ": 283,
"Ġব": 284,
"Ġপ": 285,
"à§Ģ": 286,
"স": 287,
"à¦Ĥ": 288,
"প": 289,
"Ġà¦ı": 290,
"হ": 291,
"à¦Ł": 292,
"Ġà¦Ĩ": 293,
"Ġà¦ķর": 294,
"ড": 295,
"ণ": 296,
"Ġà¦ħ": 297,
"ধ": 298,
"à§ĭ": 299,
"াà¦Ĥ": 300,
"à¦ľ": 301,
"Ġà¦ī": 302,
"hi": 303,
"nk": 304,
"thi": 305,
"ষ": 306,
"à¦Ľ": 307,
"Ġন": 308,
"Ġম": 309,
"à§ĩ।": 310,
"think": 311,
"Ġà¦ľ": 312,
"à¦Ĺ": 313,
"à¦ļ": 314,
"Ġত": 315,
"Ġদ": 316,
"Ġহ": 317,
"থ": 318,
"à¦ĩ": 319,
"à¦Ń": 320,
"à§ĥ": 321,
"Ġà¦ıà¦ķ": 322,
"à¦ĸ": 323,
"à¦ł": 324,
"à§Ĥ": 325,
"Ġà¦ĵ": 326,
"রণ": 327,
"Ġà¦Ĩম": 328,
"Ġà¦ħন": 329,
"</": 330,
"Ġফ": 331,
"Ġর": 332,
"Ġশ": 333,
"়া": 334,
"Ġসà¦ķ": 335,
"Ġ'": 336,
"ফ": 337,
"à¦Ĩ": 338,
"Ġà¦Ĺ": 339,
"Ġà¦ļ": 340,
"Ġà¦Ń": 341,
"।</": 342,
"়à§ĩ": 343,
"়ি": 344,
"Ġপর": 345,
"Ġà¦ıব": 346,
"Ġহয": 347,
"Ġà¦ıà¦ķà¦Ł": 348,
"Ġ<": 349,
"à¦ı": 350,
"à§Į": 351,
"Ġয": 352,
"ি?": 353,
"যব": 354,
"দর": 355,
"Ġসম": 356,
"পর": 357,
"পন": 358,
"Ġà¦ıà¦ĩ": 359,
"Ġà¦Ĩপন": 360,
"à¦ľà¦¨": 361,
"Ġà¦īà¦ļ": 362,
"Ġহব": 363,
"à¦ĸত": 364,
"Ġà¦ĵà¦ł": 365,
"à¦Ĩম": 366,
"?'": 367,
"ĠA": 368,
"ĠB": 369,
"à¦ģ": 370,
"à¦ħ": 371,
"à¦Ļ": 372,
"Ġধ": 373,
"Ġà¦Ł": 374,
"া।": 375,
"রত": 376,
"রয": 377,
"রশ": 378,
"রহ": 379,
"à§ĩ?": 380,
"ি।": 381,
"তর": 382,
"তà¦ı": 383,
"লন": 384,
"à¦¯à¦Ł": 385,
"়।": 386,
"Ġসত": 387,
"Ġবল": 388,
"সব": 389,
"Ġà¦ıà¦Ł": 390,
"হল": 391,
"Ġà¦Ĩà¦Ľ": 392,
"Ġà¦Ĩà¦Ĺ": 393,
"ধন": 394,
"à¦ľà¦§": 395,
"Ġà¦īড": 396,
"Ġমরণ": 397,
"Ġà¦ľà¦¨": 398,
"Ġতথ": 399,
"Ġফল": 400,
"Ġসà¦ķল": 401,
"ফল": 402,
"তà¦ıব": 403,
"Ġমরণশ": 404
},
"merges": [
[
"à",
"¦"
],
[
"à",
"§"
],
[
"Ġ",
"à¦"
],
[
"à¦",
"¾"
],
[
"à¦",
"°"
],
[
"à§",
"ĩ"
],
[
"à§",
"į"
],
[
"à¦",
"¿"
],
[
"à¦",
"¨"
],
[
"à¦",
"¤"
],
[
"à¦",
"²"
],
[
"à¦",
"¯"
],
[
"à¦",
"¬"
],
[
"à¦",
"ķ"
],
[
"¥",
"¤"
],
[
"à",
"¥¤"
],
[
"à¦",
"¦"
],
[
"à¦",
"¼"
],
[
"à¦",
"®"
],
[
"à§",
"ģ"
],
[
"Ġà¦",
"¸"
],
[
"à¦",
"¶"
],
[
"Ġà¦",
"ķ"
],
[
"Ġà¦",
"¬"
],
[
"Ġà¦",
"ª"
],
[
"à§",
"Ģ"
],
[
"à¦",
"¸"
],
[
"à¦",
"Ĥ"
],
[
"à¦",
"ª"
],
[
"Ġà¦",
"ı"
],
[
"à¦",
"¹"
],
[
"à¦",
"Ł"
],
[
"Ġà¦",
"Ĩ"
],
[
"Ġà¦ķ",
"à¦°"
],
[
"à¦",
"¡"
],
[
"à¦",
"£"
],
[
"Ġà¦",
"ħ"
],
[
"à¦",
"§"
],
[
"à§",
"ĭ"
],
[
"à¦¾",
"à¦Ĥ"
],
[
"à¦",
"ľ"
],
[
"Ġà¦",
"ī"
],
[
"h",
"i"
],
[
"n",
"k"
],
[
"t",
"hi"
],
[
"à¦",
"·"
],
[
"à¦",
"Ľ"
],
[
"Ġà¦",
"¨"
],
[
"Ġà¦",
"®"
],
[
"à§ĩ",
"à¥¤"
],
[
"thi",
"nk"
],
[
"Ġà¦",
"ľ"
],
[
"à¦",
"Ĺ"
],
[
"à¦",
"ļ"
],
[
"Ġà¦",
"¤"
],
[
"Ġà¦",
"¦"
],
[
"Ġà¦",
"¹"
],
[
"à¦",
"¥"
],
[
"à¦",
"ĩ"
],
[
"à¦",
"Ń"
],
[
"à§",
"ĥ"
],
[
"Ġà¦ı",
"à¦ķ"
],
[
"à¦",
"ĸ"
],
[
"à¦",
"ł"
],
[
"à§",
"Ĥ"
],
[
"Ġà¦",
"ĵ"
],
[
"à¦°",
"à¦£"
],
[
"Ġà¦Ĩ",
"à¦®"
],
[
"Ġà¦ħ",
"à¦¨"
],
[
"<",
"/"
],
[
"Ġà¦",
"«"
],
[
"Ġà¦",
"°"
],
[
"Ġà¦",
"¶"
],
[
"à¦¼",
"à¦¾"
],
[
"Ġà¦¸",
"à¦ķ"
],
[
"Ġ",
"'"
],
[
"à¦",
"«"
],
[
"à¦",
"Ĩ"
],
[
"Ġà¦",
"Ĺ"
],
[
"Ġà¦",
"ļ"
],
[
"Ġà¦",
"Ń"
],
[
"à¥¤",
"</"
],
[
"à¦¼",
"à§ĩ"
],
[
"à¦¼",
"à¦¿"
],
[
"Ġà¦ª",
"à¦°"
],
[
"Ġà¦ı",
"à¦¬"
],
[
"Ġà¦¹",
"à¦¯"
],
[
"Ġà¦ıà¦ķ",
"à¦Ł"
],
[
"Ġ",
"<"
],
[
"à¦",
"ı"
],
[
"à§",
"Į"
],
[
"Ġà¦",
"¯"
],
[
"à¦¿",
"?"
],
[
"à¦¯",
"à¦¬"
],
[
"à¦¦",
"à¦°"
],
[
"Ġà¦¸",
"à¦®"
],
[
"à¦ª",
"à¦°"
],
[
"à¦ª",
"à¦¨"
],
[
"Ġà¦ı",
"à¦ĩ"
],
[
"Ġà¦Ĩ",
"à¦ªà¦¨"
],
[
"à¦ľ",
"à¦¨"
],
[
"Ġà¦ī",
"à¦ļ"
],
[
"Ġà¦¹",
"à¦¬"
],
[
"à¦ĸ",
"à¦¤"
],
[
"Ġà¦ĵ",
"à¦ł"
],
[
"à¦Ĩ",
"à¦®"
],
[
"?",
"'"
],
[
"Ġ",
"A"
],
[
"Ġ",
"B"
],
[
"à¦",
"ģ"
],
[
"à¦",
"ħ"
],
[
"à¦",
"Ļ"
],
[
"Ġà¦",
"§"
],
[
"Ġà¦",
"Ł"
],
[
"à¦¾",
"à¥¤"
],
[
"à¦°",
"à¦¤"
],
[
"à¦°",
"à¦¯"
],
[
"à¦°",
"à¦¶"
],
[
"à¦°",
"à¦¹"
],
[
"à§ĩ",
"?"
],
[
"à¦¿",
"à¥¤"
],
[
"à¦¤",
"à¦°"
],
[
"à¦¤",
"à¦ı"
],
[
"à¦²",
"à¦¨"
],
[
"à¦¯",
"à¦Ł"
],
[
"à¦¼",
"à¥¤"
],
[
"Ġà¦¸",
"à¦¤"
],
[
"Ġà¦¬",
"à¦²"
],
[
"à¦¸",
"à¦¬"
],
[
"Ġà¦ı",
"à¦Ł"
],
[
"à¦¹",
"à¦²"
],
[
"Ġà¦Ĩ",
"à¦Ľ"
],
[
"Ġà¦Ĩ",
"à¦Ĺ"
],
[
"à¦§",
"à¦¨"
],
[
"à¦ľ",
"à¦§"
],
[
"Ġà¦ī",
"à¦¡"
],
[
"Ġà¦®",
"à¦°à¦£"
],
[
"Ġà¦ľ",
"à¦¨"
],
[
"Ġà¦¤",
"à¦¥"
],
[
"Ġà¦«",
"à¦²"
],
[
"Ġà¦¸à¦ķ",
"à¦²"
],
[
"à¦«",
"à¦²"
],
[
"à¦¤à¦ı",
"à¦¬"
],
[
"Ġà¦®à¦°à¦£",
"à¦¶"
]
]
}
}