NPComposer-v2 / tokenizer_config.json
ralyn's picture
Training in progress, epoch 1
6079c92 verified
{
"added_tokens_decoder": {
"0": {
"content": "<bos>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"1": {
"content": "<eos>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2": {
"content": "<pad>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"3": {
"content": "<mask>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2361": {
"content": "<unk>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2362": {
"content": "<aromatic_rings_count:0>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2363": {
"content": "<aromatic_rings_count:10>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2364": {
"content": "<aromatic_rings_count:11>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2365": {
"content": "<aromatic_rings_count:12>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2366": {
"content": "<aromatic_rings_count:13>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2367": {
"content": "<aromatic_rings_count:14>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2368": {
"content": "<aromatic_rings_count:15>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2369": {
"content": "<aromatic_rings_count:16>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2370": {
"content": "<aromatic_rings_count:17>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2371": {
"content": "<aromatic_rings_count:18>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2372": {
"content": "<aromatic_rings_count:19>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2373": {
"content": "<aromatic_rings_count:1>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2374": {
"content": "<aromatic_rings_count:20>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2375": {
"content": "<aromatic_rings_count:22>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2376": {
"content": "<aromatic_rings_count:2>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2377": {
"content": "<aromatic_rings_count:3>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2378": {
"content": "<aromatic_rings_count:4>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2379": {
"content": "<aromatic_rings_count:5>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2380": {
"content": "<aromatic_rings_count:6>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2381": {
"content": "<aromatic_rings_count:7>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2382": {
"content": "<aromatic_rings_count:8>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2383": {
"content": "<aromatic_rings_count:9>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2384": {
"content": "<np_classifier_is_glycoside:False>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2385": {
"content": "<np_classifier_is_glycoside:True>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2386": {
"content": "<np_classifier_pathway:Alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2387": {
"content": "<np_classifier_pathway:Amino acids and Peptides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2388": {
"content": "<np_classifier_pathway:Carbohydrates>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2389": {
"content": "<np_classifier_pathway:Fatty acids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2390": {
"content": "<np_classifier_pathway:Polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2391": {
"content": "<np_classifier_pathway:Shikimates and Phenylpropanoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2392": {
"content": "<np_classifier_pathway:Terpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2393": {
"content": "<np_classifier_superclass:Alkylresorcinols>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2394": {
"content": "<np_classifier_superclass:Amino acid glycosides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2395": {
"content": "<np_classifier_superclass:Aminosugars and aminoglycosides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2396": {
"content": "<np_classifier_superclass:Anthranilic acid alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2397": {
"content": "<np_classifier_superclass:Apocarotenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2398": {
"content": "<np_classifier_superclass:Aromatic polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2399": {
"content": "<np_classifier_superclass:Carotenoids (C40)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2400": {
"content": "<np_classifier_superclass:Carotenoids (C45)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2401": {
"content": "<np_classifier_superclass:Carotenoids (C50)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2402": {
"content": "<np_classifier_superclass:Chromanes>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2403": {
"content": "<np_classifier_superclass:Coumarins>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2404": {
"content": "<np_classifier_superclass:Cyclic polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2405": {
"content": "<np_classifier_superclass:Diarylheptanoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2406": {
"content": "<np_classifier_superclass:Diazotetronic acids and derivatives>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2407": {
"content": "<np_classifier_superclass:Diphenyl ethers (DPEs)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2408": {
"content": "<np_classifier_superclass:Diterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2409": {
"content": "<np_classifier_superclass:Docosanoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2410": {
"content": "<np_classifier_superclass:Eicosanoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2411": {
"content": "<np_classifier_superclass:Fatty Acids and Conjugates>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2412": {
"content": "<np_classifier_superclass:Fatty acyl glycosides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2413": {
"content": "<np_classifier_superclass:Fatty acyls>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2414": {
"content": "<np_classifier_superclass:Fatty amides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2415": {
"content": "<np_classifier_superclass:Fatty esters>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2416": {
"content": "<np_classifier_superclass:Flavonoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2417": {
"content": "<np_classifier_superclass:Fluorenes>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2418": {
"content": "<np_classifier_superclass:Glycerolipids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2419": {
"content": "<np_classifier_superclass:Glycerophospholipids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2420": {
"content": "<np_classifier_superclass:Guanidine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2421": {
"content": "<np_classifier_superclass:Histidine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2422": {
"content": "<np_classifier_superclass:Isoflavonoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2423": {
"content": "<np_classifier_superclass:Lignans>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2424": {
"content": "<np_classifier_superclass:Linear polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2425": {
"content": "<np_classifier_superclass:Lysine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2426": {
"content": "<np_classifier_superclass:Macrolides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2427": {
"content": "<np_classifier_superclass:Meroterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2428": {
"content": "<np_classifier_superclass:Miscellaneous alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2429": {
"content": "<np_classifier_superclass:Miscellaneous polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2430": {
"content": "<np_classifier_superclass:Mitomycin derivatives>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2431": {
"content": "<np_classifier_superclass:Monoterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2432": {
"content": "<np_classifier_superclass:Mycosporine derivatives>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2433": {
"content": "<np_classifier_superclass:Naphthalenes>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2434": {
"content": "<np_classifier_superclass:Nicotinic acid alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2435": {
"content": "<np_classifier_superclass:Nucleosides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2436": {
"content": "<np_classifier_superclass:Octadecanoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2437": {
"content": "<np_classifier_superclass:Oligopeptides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2438": {
"content": "<np_classifier_superclass:Ornithine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2439": {
"content": "<np_classifier_superclass:Peptide alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2440": {
"content": "<np_classifier_superclass:Phenanthrenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2441": {
"content": "<np_classifier_superclass:Phenolic acids (C6-C1)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2442": {
"content": "<np_classifier_superclass:Phenylethanoids (C6-C2)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2443": {
"content": "<np_classifier_superclass:Phenylpropanoids (C6-C3)>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2444": {
"content": "<np_classifier_superclass:Phloroglucinols>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2445": {
"content": "<np_classifier_superclass:Polycyclic aromatic polyketides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2446": {
"content": "<np_classifier_superclass:Polyethers>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2447": {
"content": "<np_classifier_superclass:Polyols>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2448": {
"content": "<np_classifier_superclass:Polyprenols>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2449": {
"content": "<np_classifier_superclass:Proline alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2450": {
"content": "<np_classifier_superclass:Pseudoalkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2451": {
"content": "<np_classifier_superclass:Saccharides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2452": {
"content": "<np_classifier_superclass:Serine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2453": {
"content": "<np_classifier_superclass:Sesquiterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2454": {
"content": "<np_classifier_superclass:Sesterterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2455": {
"content": "<np_classifier_superclass:Small peptides>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2456": {
"content": "<np_classifier_superclass:Sphingolipids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2457": {
"content": "<np_classifier_superclass:Steroids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2458": {
"content": "<np_classifier_superclass:Stilbenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2459": {
"content": "<np_classifier_superclass:Styrylpyrones>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2460": {
"content": "<np_classifier_superclass:Terphenyls>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2461": {
"content": "<np_classifier_superclass:Tetramate alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2462": {
"content": "<np_classifier_superclass:Triterpenoids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2463": {
"content": "<np_classifier_superclass:Tropolones>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2464": {
"content": "<np_classifier_superclass:Tryptophan alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2465": {
"content": "<np_classifier_superclass:Tyrosine alkaloids>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2466": {
"content": "<np_classifier_superclass:Xanthones>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2467": {
"content": "<np_classifier_superclass:β-lactams>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2468": {
"content": "<np_classifier_superclass:γ-lactam-β-lactones>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2469": {
"content": "<qed_bin:0.1<=qed<0.2>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2470": {
"content": "<qed_bin:0.2<=qed<0.3>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2471": {
"content": "<qed_bin:0.3<=qed<0.4>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2472": {
"content": "<qed_bin:0.4<=qed<0.5>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2473": {
"content": "<qed_bin:0.5<=qed<0.6>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2474": {
"content": "<qed_bin:0.6<=qed<0.7>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2475": {
"content": "<qed_bin:0.7<=qed<0.8>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2476": {
"content": "<qed_bin:0.8<=qed<0.9>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2477": {
"content": "<qed_bin:0.9<=qed<1>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2478": {
"content": "<qed_bin:0<=qed<0.1>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2479": {
"content": "<sa_bin:1<=sa<2>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2480": {
"content": "<sa_bin:2<=sa<3>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2481": {
"content": "<sa_bin:3<=sa<4>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2482": {
"content": "<sa_bin:4<=sa<5>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2483": {
"content": "<sa_bin:5<=sa<6>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2484": {
"content": "<sa_bin:6<=sa<7>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2485": {
"content": "<sa_bin:7<=sa<8>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2486": {
"content": "<sa_bin:8<=sa<9>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2487": {
"content": "<sa_bin:9<=sa<10>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
}
},
"additional_special_tokens": [
"<aromatic_rings_count:0>",
"<aromatic_rings_count:10>",
"<aromatic_rings_count:11>",
"<aromatic_rings_count:12>",
"<aromatic_rings_count:13>",
"<aromatic_rings_count:14>",
"<aromatic_rings_count:15>",
"<aromatic_rings_count:16>",
"<aromatic_rings_count:17>",
"<aromatic_rings_count:18>",
"<aromatic_rings_count:19>",
"<aromatic_rings_count:1>",
"<aromatic_rings_count:20>",
"<aromatic_rings_count:22>",
"<aromatic_rings_count:2>",
"<aromatic_rings_count:3>",
"<aromatic_rings_count:4>",
"<aromatic_rings_count:5>",
"<aromatic_rings_count:6>",
"<aromatic_rings_count:7>",
"<aromatic_rings_count:8>",
"<aromatic_rings_count:9>",
"<np_classifier_is_glycoside:False>",
"<np_classifier_is_glycoside:True>",
"<np_classifier_pathway:Alkaloids>",
"<np_classifier_pathway:Amino acids and Peptides>",
"<np_classifier_pathway:Carbohydrates>",
"<np_classifier_pathway:Fatty acids>",
"<np_classifier_pathway:Polyketides>",
"<np_classifier_pathway:Shikimates and Phenylpropanoids>",
"<np_classifier_pathway:Terpenoids>",
"<np_classifier_superclass:Alkylresorcinols>",
"<np_classifier_superclass:Amino acid glycosides>",
"<np_classifier_superclass:Aminosugars and aminoglycosides>",
"<np_classifier_superclass:Anthranilic acid alkaloids>",
"<np_classifier_superclass:Apocarotenoids>",
"<np_classifier_superclass:Aromatic polyketides>",
"<np_classifier_superclass:Carotenoids (C40)>",
"<np_classifier_superclass:Carotenoids (C45)>",
"<np_classifier_superclass:Carotenoids (C50)>",
"<np_classifier_superclass:Chromanes>",
"<np_classifier_superclass:Coumarins>",
"<np_classifier_superclass:Cyclic polyketides>",
"<np_classifier_superclass:Diarylheptanoids>",
"<np_classifier_superclass:Diazotetronic acids and derivatives>",
"<np_classifier_superclass:Diphenyl ethers (DPEs)>",
"<np_classifier_superclass:Diterpenoids>",
"<np_classifier_superclass:Docosanoids>",
"<np_classifier_superclass:Eicosanoids>",
"<np_classifier_superclass:Fatty Acids and Conjugates>",
"<np_classifier_superclass:Fatty acyl glycosides>",
"<np_classifier_superclass:Fatty acyls>",
"<np_classifier_superclass:Fatty amides>",
"<np_classifier_superclass:Fatty esters>",
"<np_classifier_superclass:Flavonoids>",
"<np_classifier_superclass:Fluorenes>",
"<np_classifier_superclass:Glycerolipids>",
"<np_classifier_superclass:Glycerophospholipids>",
"<np_classifier_superclass:Guanidine alkaloids>",
"<np_classifier_superclass:Histidine alkaloids>",
"<np_classifier_superclass:Isoflavonoids>",
"<np_classifier_superclass:Lignans>",
"<np_classifier_superclass:Linear polyketides>",
"<np_classifier_superclass:Lysine alkaloids>",
"<np_classifier_superclass:Macrolides>",
"<np_classifier_superclass:Meroterpenoids>",
"<np_classifier_superclass:Miscellaneous alkaloids>",
"<np_classifier_superclass:Miscellaneous polyketides>",
"<np_classifier_superclass:Mitomycin derivatives>",
"<np_classifier_superclass:Monoterpenoids>",
"<np_classifier_superclass:Mycosporine derivatives>",
"<np_classifier_superclass:Naphthalenes>",
"<np_classifier_superclass:Nicotinic acid alkaloids>",
"<np_classifier_superclass:Nucleosides>",
"<np_classifier_superclass:Octadecanoids>",
"<np_classifier_superclass:Oligopeptides>",
"<np_classifier_superclass:Ornithine alkaloids>",
"<np_classifier_superclass:Peptide alkaloids>",
"<np_classifier_superclass:Phenanthrenoids>",
"<np_classifier_superclass:Phenolic acids (C6-C1)>",
"<np_classifier_superclass:Phenylethanoids (C6-C2)>",
"<np_classifier_superclass:Phenylpropanoids (C6-C3)>",
"<np_classifier_superclass:Phloroglucinols>",
"<np_classifier_superclass:Polycyclic aromatic polyketides>",
"<np_classifier_superclass:Polyethers>",
"<np_classifier_superclass:Polyols>",
"<np_classifier_superclass:Polyprenols>",
"<np_classifier_superclass:Proline alkaloids>",
"<np_classifier_superclass:Pseudoalkaloids>",
"<np_classifier_superclass:Saccharides>",
"<np_classifier_superclass:Serine alkaloids>",
"<np_classifier_superclass:Sesquiterpenoids>",
"<np_classifier_superclass:Sesterterpenoids>",
"<np_classifier_superclass:Small peptides>",
"<np_classifier_superclass:Sphingolipids>",
"<np_classifier_superclass:Steroids>",
"<np_classifier_superclass:Stilbenoids>",
"<np_classifier_superclass:Styrylpyrones>",
"<np_classifier_superclass:Terphenyls>",
"<np_classifier_superclass:Tetramate alkaloids>",
"<np_classifier_superclass:Triterpenoids>",
"<np_classifier_superclass:Tropolones>",
"<np_classifier_superclass:Tryptophan alkaloids>",
"<np_classifier_superclass:Tyrosine alkaloids>",
"<np_classifier_superclass:Xanthones>",
"<np_classifier_superclass:β-lactams>",
"<np_classifier_superclass:γ-lactam-β-lactones>",
"<qed_bin:0.1<=qed<0.2>",
"<qed_bin:0.2<=qed<0.3>",
"<qed_bin:0.3<=qed<0.4>",
"<qed_bin:0.4<=qed<0.5>",
"<qed_bin:0.5<=qed<0.6>",
"<qed_bin:0.6<=qed<0.7>",
"<qed_bin:0.7<=qed<0.8>",
"<qed_bin:0.8<=qed<0.9>",
"<qed_bin:0.9<=qed<1>",
"<qed_bin:0<=qed<0.1>",
"<sa_bin:1<=sa<2>",
"<sa_bin:2<=sa<3>",
"<sa_bin:3<=sa<4>",
"<sa_bin:4<=sa<5>",
"<sa_bin:5<=sa<6>",
"<sa_bin:6<=sa<7>",
"<sa_bin:7<=sa<8>",
"<sa_bin:8<=sa<9>",
"<sa_bin:9<=sa<10>"
],
"auto_map": {
"AutoTokenizer": [
"ibm-research/MoLFormer-XL-both-10pct--tokenization_molformer.MolformerTokenizer",
"ibm-research/MoLFormer-XL-both-10pct--tokenization_molformer_fast.MolformerTokenizerFast"
]
},
"clean_up_tokenization_spaces": true,
"cls_token": "<bos>",
"mask_token": "<mask>",
"model_max_length": 1000000000000000019884624838656,
"pad_token": "<pad>",
"sep_token": "<eos>",
"tokenizer_class": "MolformerTokenizer",
"unk_token": "<unk>"
}