{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 2, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 3, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 4, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 5, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 6, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "BertNormalizer", "clean_text": true, "handle_chinese_chars": true, "strip_accents": null, "lowercase": true }, "pre_tokenizer": { "type": "BertPreTokenizer" }, "post_processor": { "type": "TemplateProcessing", "single": [ { "SpecialToken": { "id": "", "type_id": 2 } }, { "Sequence": { "id": "A", "type_id": 0 } }, { "SpecialToken": { "id": "", "type_id": 0 } } ], "pair": [ { "SpecialToken": { "id": "", "type_id": 2 } }, { "Sequence": { "id": "A", "type_id": 0 } }, { "SpecialToken": { "id": "", "type_id": 0 } }, { "Sequence": { "id": "B", "type_id": 1 } }, { "SpecialToken": { "id": "", "type_id": 1 } } ], "special_tokens": { "": { "id": "", "ids": [ 4 ], "tokens": [ "" ] }, "": { "id": "", "ids": [ 5 ], "tokens": [ "" ] } } }, "decoder": { "type": "WordPiece", "prefix": "##", "cleanup": true }, "model": { "type": "WordPiece", "unk_token": "", "continuing_subword_prefix": "##", "max_input_chars_per_word": 100, "vocab": { "": 0, "": 1, "": 2, "": 3, "": 4, "": 5, "": 6, "!": 7, "\"": 8, "#": 9, "$": 10, "%": 11, "&": 12, "'": 13, "(": 14, ")": 15, "*": 16, "+": 17, ",": 18, "-": 19, ".": 20, "/": 21, "0": 22, "1": 23, "2": 24, "3": 25, "4": 26, "5": 27, "6": 28, "7": 29, "8": 30, "9": 31, ":": 32, ";": 33, "<": 34, "=": 35, ">": 36, "?": 37, "@": 38, "[": 39, "\\": 40, "]": 41, "^": 42, "_": 43, "`": 44, "a": 45, "b": 46, "c": 47, "d": 48, "e": 49, "f": 50, "g": 51, "h": 52, "i": 53, "j": 54, "k": 55, "l": 56, "m": 57, "n": 58, "o": 59, "p": 60, "q": 61, "r": 62, "s": 63, "t": 64, "u": 65, "v": 66, "w": 67, "x": 68, "y": 69, "z": 70, "|": 71, "}": 72, "~": 73, "¡": 74, "¢": 75, "£": 76, "¥": 77, "§": 78, "°": 79, "±": 80, "²": 81, "³": 82, "´": 83, "µ": 84, "·": 85, "º": 86, "½": 87, "¿": 88, "×": 89, "ß": 90, "æ": 91, "ð": 92, "ø": 93, "þ": 94, "đ": 95, "ħ": 96, "ı": 97, "ł": 98, "œ": 99, "ɐ": 100, "ɑ": 101, "ɒ": 102, "ɔ": 103, "ə": 104, "ɛ": 105, "ɜ": 106, "ɡ": 107, "ɢ": 108, "ɪ": 109, "ɫ": 110, "ɳ": 111, "ɽ": 112, "ɾ": 113, "ʁ": 114, "ʃ": 115, "ʊ": 116, "ʋ": 117, "ʒ": 118, "ʔ": 119, "ʕ": 120, "ʲ": 121, "ʻ": 122, "ʼ": 123, "ʾ": 124, "ʿ": 125, "ˈ": 126, "ˌ": 127, "ː": 128, "α": 129, "β": 130, "γ": 131, "δ": 132, "ε": 133, "η": 134, "θ": 135, "ι": 136, "κ": 137, "λ": 138, "μ": 139, "ν": 140, "ξ": 141, "ο": 142, "π": 143, "ρ": 144, "ς": 145, "σ": 146, "τ": 147, "υ": 148, "φ": 149, "χ": 150, "ψ": 151, "ω": 152, "а": 153, "б": 154, "в": 155, "г": 156, "д": 157, "е": 158, "ж": 159, "з": 160, "и": 161, "к": 162, "л": 163, "м": 164, "н": 165, "о": 166, "п": 167, "р": 168, "с": 169, "т": 170, "у": 171, "х": 172, "ц": 173, "ш": 174, "ъ": 175, "ы": 176, "ь": 177, "ю": 178, "я": 179, "є": 180, "א": 181, "ב": 182, "ג": 183, "ה": 184, "ו": 185, "ז": 186, "ח": 187, "י": 188, "ל": 189, "ם": 190, "מ": 191, "ן": 192, "נ": 193, "ס": 194, "ף": 195, "פ": 196, "צ": 197, "ר": 198, "ש": 199, "ת": 200, "ء": 201, "ا": 202, "ب": 203, "ة": 204, "ت": 205, "ث": 206, "ج": 207, "ح": 208, "خ": 209, "د": 210, "ذ": 211, "ر": 212, "س": 213, "ش": 214, "ص": 215, "ع": 216, "ف": 217, "ق": 218, "ك": 219, "ل": 220, "م": 221, "ن": 222, "ه": 223, "و": 224, "ي": 225, "ܐ": 226, "ܕ": 227, "ܗ": 228, "ܝ": 229, "ܠ": 230, "ܢ": 231, "ܬ": 232, "अ": 233, "ई": 234, "क": 235, "ग": 236, "ण": 237, "त": 238, "द": 239, "न": 240, "प": 241, "ब": 242, "म": 243, "य": 244, "र": 245, "ल": 246, "व": 247, "स": 248, "ह": 249, "ा": 250, "ि": 251, "আ": 252, "ল": 253, "হ": 254, "া": 255, "ਅ": 256, "ਲ": 257, "ਹ": 258, "ਾ": 259, "അ": 260, "ള": 261, "ഹ": 262, "ാ": 263, "ก": 264, "ค": 265, "ง": 266, "ช": 267, "ซ": 268, "ญ": 269, "ฐ": 270, "ณ": 271, "ด": 272, "ต": 273, "น": 274, "บ": 275, "ป": 276, "พ": 277, "ภ": 278, "ม": 279, "ย": 280, "ร": 281, "ล": 282, "ว": 283, "ศ": 284, "ษ": 285, "ส": 286, "ห": 287, "อ": 288, "ฮ": 289, "ะ": 290, "า": 291, "เ": 292, "แ": 293, "ไ": 294, "ა": 295, "ბ": 296, "გ": 297, "დ": 298, "ე": 299, "ვ": 300, "ზ": 301, "თ": 302, "ი": 303, "კ": 304, "ლ": 305, "მ": 306, "ნ": 307, "ო": 308, "პ": 309, "ჟ": 310, "რ": 311, "ს": 312, "ტ": 313, "უ": 314, "ფ": 315, "ქ": 316, "ღ": 317, "ყ": 318, "შ": 319, "ჩ": 320, "ც": 321, "ძ": 322, "წ": 323, "ჭ": 324, "ხ": 325, "ჯ": 326, "ჰ": 327, "ჱ": 328, "ჲ": 329, "ჳ": 330, "ჴ": 331, "ჵ": 332, "ჶ": 333, "ჷ": 334, "ჸ": 335, "ჹ": 336, "ჺ": 337, "჻": 338, "ᄃ": 339, "ᄅ": 340, "ᄇ": 341, "ᄋ": 342, "ᄌ": 343, "ᅡ": 344, "ᅢ": 345, "ᅦ": 346, "ᅧ": 347, "ᅩ": 348, "ᅮ": 349, "ᅵ": 350, "ᆨ": 351, "ᆫ": 352, "ᆯ": 353, "ᆸ": 354, "ᆼ": 355, "ᵻ": 356, "‐": 357, "‑": 358, "–": 359, "—": 360, "―": 361, "‘": 362, "’": 363, "“": 364, "”": 365, "„": 366, "†": 367, "‡": 368, "•": 369, "…": 370, "′": 371, "″": 372, "⁄": 373, "₣": 374, "₤": 375, "€": 376, "₹": 377, "⅓": 378, "⅔": 379, "→": 380, "−": 381, "≡": 382, "≤": 383, "①": 384, "☉": 385, "☫": 386, "♀": 387, "♭": 388, "♯": 389, "⚳": 390, "ⴀ": 391, "ⴂ": 392, "ⴃ": 393, "ⴈ": 394, "ⴌ": 395, "ⴕ": 396, "ⴟ": 397, "〈": 398, "〉": 399, "〜": 400, "あ": 401, "い": 402, "う": 403, "お": 404, "か": 405, "き": 406, "く": 407, "け": 408, "こ": 409, "さ": 410, "し": 411, "す": 412, "せ": 413, "た": 414, "ち": 415, "っ": 416, "つ": 417, "と": 418, "な": 419, "に": 420, "の": 421, "は": 422, "ひ": 423, "ふ": 424, "ほ": 425, "ま": 426, "み": 427, "め": 428, "も": 429, "ゃ": 430, "ゆ": 431, "ょ": 432, "ら": 433, "り": 434, "る": 435, "れ": 436, "わ": 437, "を": 438, "ん": 439, "ァ": 440, "ア": 441, "ィ": 442, "イ": 443, "ゥ": 444, "ウ": 445, "ェ": 446, "エ": 447, "ォ": 448, "オ": 449, "カ": 450, "キ": 451, "ク": 452, "ケ": 453, "コ": 454, "サ": 455, "シ": 456, "ス": 457, "セ": 458, "タ": 459, "チ": 460, "ッ": 461, "ツ": 462, "テ": 463, "ト": 464, "ナ": 465, "ニ": 466, "ネ": 467, "ノ": 468, "ハ": 469, "フ": 470, "ヘ": 471, "マ": 472, "ミ": 473, "ム": 474, "モ": 475, "ャ": 476, "ュ": 477, "ョ": 478, "ラ": 479, "リ": 480, "ル": 481, "レ": 482, "ロ": 483, "ン": 484, "・": 485, "ー": 486, "一": 487, "七": 488, "下": 489, "世": 490, "丙": 491, "中": 492, "主": 493, "乃": 494, "之": 495, "乙": 496, "九": 497, "二": 498, "云": 499, "人": 500, "今": 501, "付": 502, "作": 503, "侗": 504, "依": 505, "信": 506, "傳": 507, "儚": 508, "充": 509, "光": 510, "全": 511, "兵": 512, "其": 513, "具": 514, "円": 515, "再": 516, "出": 517, "判": 518, "前": 519, "剛": 520, "劇": 521, "劉": 522, "動": 523, "化": 524, "北": 525, "华": 526, "厂": 527, "去": 528, "古": 529, "可": 530, "台": 531, "史": 532, "同": 533, "名": 534, "君": 535, "吳": 536, "周": 537, "命": 538, "和": 539, "咲": 540, "善": 541, "四": 542, "國": 543, "園": 544, "圣": 545, "在": 546, "坂": 547, "堤": 548, "場": 549, "塘": 550, "夕": 551, "大": 552, "天": 553, "夫": 554, "女": 555, "妙": 556, "姚": 557, "子": 558, "孟": 559, "守": 560, "安": 561, "宋": 562, "完": 563, "宗": 564, "宝": 565, "宫": 566, "寝": 567, "寺": 568, "小": 569, "少": 570, "尾": 571, "山": 572, "岳": 573, "川": 574, "州": 575, "巳": 576, "市": 577, "師": 578, "平": 579, "广": 580, "庆": 581, "府": 582, "座": 583, "廬": 584, "建": 585, "式": 586, "張": 587, "彌": 588, "彩": 589, "彼": 590, "後": 591, "御": 592, "德": 593, "思": 594, "愛": 595, "憑": 596, "憶": 597, "應": 598, "懷": 599, "战": 600, "戦": 601, "扈": 602, "技": 603, "拉": 604, "拳": 605, "挑": 606, "揺": 607, "攻": 608, "放": 609, "政": 610, "散": 611, "斯": 612, "方": 613, "日": 614, "旦": 615, "旭": 616, "昌": 617, "明": 618, "星": 619, "春": 620, "晋": 621, "景": 622, "曦": 623, "月": 624, "望": 625, "未": 626, "本": 627, "李": 628, "村": 629, "杜": 630, "束": 631, "来": 632, "林": 633, "桜": 634, "梶": 635, "棘": 636, "椎": 637, "楊": 638, "楚": 639, "榮": 640, "橘": 641, "機": 642, "正": 643, "殻": 644, "殿": 645, "母": 646, "水": 647, "汉": 648, "沂": 649, "沙": 650, "河": 651, "泗": 652, "波": 653, "泣": 654, "洪": 655, "淹": 656, "清": 657, "湯": 658, "漢": 659, "澄": 660, "澤": 661, "火": 662, "灯": 663, "灵": 664, "灼": 665, "焼": 666, "熱": 667, "物": 668, "狐": 669, "狸": 670, "玄": 671, "王": 672, "玩": 673, "珂": 674, "珙": 675, "球": 676, "理": 677, "琦": 678, "琪": 679, "瓊": 680, "生": 681, "田": 682, "畢": 683, "番": 684, "瘡": 685, "白": 686, "皮": 687, "真": 688, "砲": 689, "礮": 690, "祈": 691, "神": 692, "祠": 693, "秋": 694, "空": 695, "立": 696, "精": 697, "約": 698, "絵": 699, "織": 700, "義": 701, "翠": 702, "者": 703, "耕": 704, "肖": 705, "胡": 706, "膀": 707, "臂": 708, "興": 709, "良": 710, "花": 711, "芳": 712, "芽": 713, "若": 714, "英": 715, "藕": 716, "藥": 717, "蘄": 718, "蘇": 719, "行": 720, "裁": 721, "規": 722, "覺": 723, "观": 724, "解": 725, "記": 726, "誓": 727, "誡": 728, "誰": 729, "謎": 730, "许": 731, "谭": 732, "豪": 733, "豫": 734, "費": 735, "贵": 736, "赤": 737, "趙": 738, "足": 739, "跡": 740, "転": 741, "辛": 742, "逆": 743, "遇": 744, "運": 745, "過": 746, "遠": 747, "選": 748, "邦": 749, "邱": 750, "部": 751, "郭": 752, "都": 753, "酈": 754, "里": 755, "野": 756, "金": 757, "銃": 758, "鋼": 759, "錄": 760, "錡": 761, "鍵": 762, "鐵": 763, "钱": 764, "铁": 765, "關": 766, "防": 767, "阿": 768, "陈": 769, "陳": 770, "陽": 771, "隊": 772, "階": 773, "集": 774, "雪": 775, "雲": 776, "霖": 777, "霹": 778, "靂": 779, "韓": 780, "願": 781, "顯": 782, "颜": 783, "马": 784, "高": 785, "龍": 786, "ﷲ": 787, "ﻋ": 788, "/": 789, "3": 790, "~": 791, "##o": 792, "##m": 793, "##g": 794, "##e": 795, "##n": 796, "##i": 797, "##t": 798, "##y": 799, "##l": 800, "##d": 801, "##s": 802, "##r": 803, "##w": 804, "##a": 805, "##c": 806, "##u": 807, "##k": 808, "##f": 809, "##b": 810, "##h": 811, "##v": 812, "##5": 813, "##ォ": 814, "##ル": 815, "##ト": 816, "##ゥ": 817, "##ナ": 818, "##j": 819, "##p": 820, "##2": 821, "##7": 822, "##z": 823, "##q": 824, "##x": 825, "##4": 826, "##9": 827, "##6": 828, "##3": 829, "##0": 830, "##8": 831, "##ל": 832, "##ו": 833, "##ה": 834, "##1": 835, "##ł": 836, "##р": 837, "##е": 838, "##м": 839, "##а": 840, "##ภ": 841, "##า": 842, "##ด": 843, "##ο": 844, "##ρ": 845, "##υ": 846, "##ς": 847, "##た": 848, "##し": 849, "##の": 850, "##す": 851, "##き": 852, "##な": 853, "##ひ": 854, "##と": 855, "##ე": 856, "##ლ": 857, "##მ": 858, "##წ": 859, "##ი": 860, "##ფ": 861, "##ε": 862, "##ν": 863, "##ل": 864, "##ر": 865, "##و": 866, "##ح": 867, "##ø": 868, "##უ": 869, "##ც": 870, "##ს": 871, "##т": 872, "##и": 873, "##ш": 874, "##с": 875, "##к": 876, "##ا": 877, "##ك": 878, "##د": 879, "##ਲ": 880, "##ਹ": 881, "##ق": 882, "##ي": 883, "##ش": 884, "##ı": 885, "##н": 886, "##ы": 887, "##ा": 888, "##न": 889, "##ई": 890, "##ɒ": 891, "##ə": 892, "##ਾ": 893, "##ɪ": 894, "##ʊ": 895, "##ˌ": 896, "##ː": 897, "##ء": 898, "##ع": 899, "##ب": 900, "##æ": 901, "##ɡ": 902, "##ण": 903, "##र": 904, "##ɑ": 905, "##ウ": 906, "##ァ": 907, "##キ": 908, "##ュ": 909, "##リ": 910, "##ア": 911, "##3": 912, "##ᵻ": 913, "##ʻ": 914, "##も": 915, "##ъ": 916, "##в": 917, "##م": 918, "##ن": 919, "##ク": 920, "##サ": 921, "##ス": 922, "##ッ": 923, "##ラ": 924, "##ー": 925, "##о": 926, "##л": 927, "##ˈ": 928, "##ɳ": 929, "##व": 930, "##ह": 931, "##ि": 932, "##क": 933, "##ᅡ": 934, "##ᆯ": 935, "##ᄅ": 936, "##α": 937, "##め": 938, "##พ": 939, "##แ": 940, "##ก": 941, "##β": 942, "##ɽ": 943, "##у": 944, "##я": 945, "##ɛ": 946, "##ხ": 947, "##რ": 948, "##レ": 949, "##イ": 950, "##ン": 951, "##θ": 952, "##ɔ": 953, "##פ": 954, "##ث": 955, "##י": 956, "##ო": 957, "##γ": 958, "##は": 959, "##り": 960, "##あ": 961, "##ん": 962, "##ם": 963, "##ω": 964, "##シ": 965, "##đ": 966, "##ю": 967, "##з": 968, "##ɾ": 969, "##п": 970, "##д": 971, "##ल": 972, "##い": 973, "##ه": 974, "##º": 975, "##ร": 976, "##ж": 977, "##द": 978, "##フ": 979, "##タ": 980, "##ქ": 981, "##ა": 982, "##ნ": 983, "##დ": 984, "##っ": 985, "##ょ": 986, "##に": 987, "##テ": 988, "##ィ": 989, "##ニ": 990, "##ะ": 991, "##ช": 992, "##อ": 993, "##น": 994, "##ვ": 995, "##マ": 996, "##お": 997, "##χ": 998, "##π": 999, "##τ": 1000, "##ι": 1001, "##κ": 1002, "##σ": 1003, "##г": 1004, "##ت": 1005, "##セ": 1006, "##オ": 1007, "##μ": 1008, "##ค": 1009, "##ว": 1010, "##ต": 1011, "##ロ": 1012, "##გ": 1013, "##ʃ": 1014, "##ב": 1015, "##ת": 1016, "##א": 1017, "##ミ": 1018, "##か": 1019, "##こ": 1020, "##く": 1021, "##れ": 1022, "##ʔ": 1023, "##δ": 1024, "##ة": 1025, "##ʁ": 1026, "##ハ": 1027, "##ש": 1028, "##מ": 1029, "##צ": 1030, "##ള": 1031, "##ჲ": 1032, "##ף": 1033, "##う": 1034, "##ð": 1035, "##თ": 1036, "##ᄇ": 1037, "##ᅮ": 1038, "##ᄃ": 1039, "##ᅢ": 1040, "##া": 1041, "##হ": 1042, "##ネ": 1043, "##ョ": 1044, "##る": 1045, "##ʲ": 1046, "##س": 1047, "##み": 1048, "##є": 1049, "##λ": 1050, "##チ": 1051, "##ら": 1052, "##ム": 1053, "##ェ": 1054, "##ล": 1055, "##ย": 1056, "##ณ": 1057, "##ม": 1058, "##ص": 1059, "##ɫ": 1060, "##ป": 1061, "##ß": 1062, "##ف": 1063, "##わ": 1064, "##ʿ": 1065, "##ツ": 1066, "##ܠ": 1067, "##ܗ": 1068, "##ܐ": 1069, "##ノ": 1070, "##ן": 1071, "##ল": 1072, "##ま": 1073, "##ტ": 1074, "##ჱ": 1075, "##ฮ": 1076, "##ξ": 1077, "##เ": 1078, "##ാ": 1079, "##ഹ": 1080, "##ɐ": 1081, "##ჳ": 1082, "##ゆ": 1083, "##ग": 1084, "##カ": 1085, "##ซ": 1086, "##ャ": 1087, "##モ": 1088, "##خ": 1089, "##ᅦ": 1090, "##ᅩ": 1091, "##ᆨ": 1092, "##ᅵ": 1093, "##ᆸ": 1094, "##ᅧ": 1095, "##ᆼ": 1096, "##ᄋ": 1097, "##ᆫ": 1098, "##つ": 1099, "##せ": 1100, "##ס": 1101, "##η": 1102, "##х": 1103, "##ง": 1104, "##ไ": 1105, "##ц": 1106, "##ь": 1107, "##ψ": 1108, "##ʒ": 1109, "##נ": 1110, "##ち": 1111, "##ゃ": 1112, "##ר": 1113, "##œ": 1114, "##ܕ": 1115, "##ܝ": 1116, "##ܢ": 1117, "##ܬ": 1118, "##ذ": 1119, "##ษ": 1120, "##ฐ": 1121, "##を": 1122, "##ɜ": 1123, "##स": 1124, "##エ": 1125 } } }