| { | |
| "version": "1.0", | |
| "truncation": null, | |
| "padding": null, | |
| "added_tokens": [ | |
| { | |
| "id": 0, | |
| "content": "<|bos|>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 1, | |
| "content": "<|cond|>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 2, | |
| "content": "<|sep|>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 3, | |
| "content": "<|eos|>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 4, | |
| "content": "[UNK]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| } | |
| ], | |
| "normalizer": { | |
| "type": "Sequence", | |
| "normalizers": [ | |
| { | |
| "type": "Replace", | |
| "pattern": { | |
| "Regex": "=" | |
| }, | |
| "content": " = " | |
| }, | |
| { | |
| "type": "Replace", | |
| "pattern": { | |
| "Regex": "(?<=[A-Za-z0-9])(?=[A-Z])" | |
| }, | |
| "content": " " | |
| } | |
| ] | |
| }, | |
| "pre_tokenizer": { | |
| "type": "Sequence", | |
| "pretokenizers": [ | |
| { | |
| "type": "Split", | |
| "pattern": { | |
| "String": "\n" | |
| }, | |
| "behavior": "Isolated", | |
| "invert": false | |
| }, | |
| { | |
| "type": "Split", | |
| "pattern": { | |
| "String": " " | |
| }, | |
| "behavior": "Removed", | |
| "invert": false | |
| }, | |
| { | |
| "type": "Digits", | |
| "individual_digits": false | |
| }, | |
| { | |
| "type": "Split", | |
| "pattern": { | |
| "Regex": "\\d{2}|\\d" | |
| }, | |
| "behavior": "Isolated", | |
| "invert": false | |
| } | |
| ] | |
| }, | |
| "post_processor": null, | |
| "decoder": { | |
| "type": "Fuse" | |
| }, | |
| "model": { | |
| "type": "WordLevel", | |
| "vocab": { | |
| "[UNK]": 4, | |
| ".": 5, | |
| "\n": 6, | |
| "00": 7, | |
| "2": 8, | |
| "0": 9, | |
| "4": 10, | |
| "3": 11, | |
| "1": 12, | |
| "10": 13, | |
| "6": 14, | |
| "5": 15, | |
| "11": 16, | |
| "12": 17, | |
| "13": 18, | |
| "14": 19, | |
| "7": 20, | |
| "15": 21, | |
| "16": 22, | |
| "17": 23, | |
| "18": 24, | |
| "8": 25, | |
| "19": 26, | |
| "20": 27, | |
| "9": 28, | |
| "21": 29, | |
| "22": 30, | |
| "23": 31, | |
| "24": 32, | |
| "25": 33, | |
| "26": 34, | |
| "90": 35, | |
| "27": 36, | |
| "28": 37, | |
| "29": 38, | |
| "H": 39, | |
| "30": 40, | |
| "31": 41, | |
| "32": 42, | |
| "33": 43, | |
| "01": 44, | |
| "34": 45, | |
| "S": 46, | |
| "02": 47, | |
| "03": 48, | |
| "35": 49, | |
| "04": 50, | |
| "36": 51, | |
| "37": 52, | |
| "05": 53, | |
| "38": 54, | |
| "06": 55, | |
| "39": 56, | |
| "09": 57, | |
| "95": 58, | |
| "08": 59, | |
| "42": 60, | |
| "07": 61, | |
| "98": 62, | |
| "40": 63, | |
| "93": 64, | |
| "56": 65, | |
| "94": 66, | |
| "71": 67, | |
| "97": 68, | |
| "85": 69, | |
| "91": 70, | |
| "84": 71, | |
| "41": 72, | |
| "60": 73, | |
| "92": 74, | |
| "46": 75, | |
| "55": 76, | |
| "86": 77, | |
| "49": 78, | |
| "53": 79, | |
| "79": 80, | |
| "51": 81, | |
| "43": 82, | |
| "88": 83, | |
| "89": 84, | |
| "48": 85, | |
| "87": 86, | |
| "45": 87, | |
| "54": 88, | |
| "78": 89, | |
| "63": 90, | |
| "66": 91, | |
| "69": 92, | |
| "99": 93, | |
| "57": 94, | |
| "82": 95, | |
| "62": 96, | |
| "96": 97, | |
| "74": 98, | |
| "83": 99, | |
| "47": 100, | |
| "58": 101, | |
| "80": 102, | |
| "65": 103, | |
| "77": 104, | |
| "73": 105, | |
| "68": 106, | |
| "81": 107, | |
| "75": 108, | |
| "59": 109, | |
| "72": 110, | |
| "64": 111, | |
| "61": 112, | |
| "76": 113, | |
| "52": 114, | |
| "70": 115, | |
| "44": 116, | |
| "50": 117, | |
| "67": 118, | |
| "=": 119, | |
| "-": 120, | |
| "Se": 121, | |
| "Al": 122, | |
| "C": 123, | |
| "Te": 124, | |
| "Si": 125, | |
| "Ti": 126, | |
| "P": 127, | |
| "Ga": 128, | |
| "N": 129, | |
| "Pd": 130, | |
| "O": 131, | |
| "Cl": 132, | |
| "Ca": 133, | |
| "Hf": 134, | |
| "As": 135, | |
| "In": 136, | |
| "Pt": 137, | |
| "Ni": 138, | |
| "Na": 139, | |
| "Ge": 140, | |
| "Zn": 141, | |
| "Sn": 142, | |
| "Cu": 143, | |
| "Zr": 144, | |
| "Rh": 145, | |
| "Au": 146, | |
| "Sb": 147, | |
| "Ag": 148, | |
| "V": 149, | |
| "Y": 150, | |
| "K": 151, | |
| "Sc": 152, | |
| "Ta": 153, | |
| "Nb": 154, | |
| "<|bos|>": 155, | |
| "<|cond|>": 156, | |
| "<|eos|>": 157, | |
| "<|sep|>": 158, | |
| "ads": 159, | |
| "bin": 160, | |
| "composition": 161, | |
| "relax": 162, | |
| "target_bin": 163, | |
| "task": 164, | |
| "Sr": 165, | |
| "Mo": 166, | |
| "Co": 167, | |
| "Pb": 168, | |
| "Hg": 169, | |
| "Ru": 170, | |
| "Ir": 171, | |
| "Bi": 172, | |
| "Mn": 173, | |
| "Fe": 174, | |
| "Tl": 175, | |
| "Cd": 176, | |
| "Cr": 177, | |
| "Rb": 178, | |
| "W": 179, | |
| "Re": 180, | |
| "Tc": 181, | |
| "Cs": 182, | |
| "Os": 183, | |
| "B": 184 | |
| }, | |
| "unk_token": "[UNK]" | |
| } | |
| } |