ModChemBERT-MLM-DAPT / config.json
eacortes's picture
Upload 19 files
297a8a9 verified
{
"architectures": [
"ModChemBertForMaskedLM",
"ModChemBertForSequenceClassification"
],
"attention_bias": false,
"attention_dropout": 0.1,
"auto_map": {
"AutoConfig": "configuration_modchembert.ModChemBertConfig",
"AutoModelForMaskedLM": "modeling_modchembert.ModChemBertForMaskedLM",
"AutoModelForSequenceClassification": "modeling_modchembert.ModChemBertForSequenceClassification"
},
"bos_token_id": 0,
"classifier_activation": "gelu",
"classifier_bias": false,
"classifier_dropout": 0.0,
"classifier_pooling": "max_seq_mha",
"classifier_pooling_attention_dropout": 0.1,
"classifier_pooling_last_k": 3,
"classifier_pooling_num_attention_heads": 4,
"cls_token_id": 0,
"decoder_bias": true,
"deterministic_flash_attn": false,
"dtype": "bfloat16",
"embedding_dropout": 0.1,
"eos_token_id": 1,
"global_attn_every_n_layers": 3,
"global_rope_theta": 160000.0,
"hidden_activation": "gelu",
"hidden_size": 768,
"id2label": {
"0": "MaxAbsEStateIndex",
"1": "MaxEStateIndex",
"2": "MinAbsEStateIndex",
"3": "MinEStateIndex",
"4": "qed",
"5": "SPS",
"6": "MolWt",
"7": "HeavyAtomMolWt",
"8": "ExactMolWt",
"9": "NumValenceElectrons",
"10": "MaxPartialCharge",
"11": "MinPartialCharge",
"12": "MaxAbsPartialCharge",
"13": "MinAbsPartialCharge",
"14": "FpDensityMorgan1",
"15": "FpDensityMorgan2",
"16": "FpDensityMorgan3",
"17": "BCUT2D_MWHI",
"18": "BCUT2D_MWLOW",
"19": "BCUT2D_CHGHI",
"20": "BCUT2D_CHGLO",
"21": "BCUT2D_LOGPHI",
"22": "BCUT2D_LOGPLOW",
"23": "BCUT2D_MRHI",
"24": "BCUT2D_MRLOW",
"25": "AvgIpc",
"26": "BalabanJ",
"27": "BertzCT",
"28": "Chi0",
"29": "Chi0n",
"30": "Chi0v",
"31": "Chi1",
"32": "Chi1n",
"33": "Chi1v",
"34": "Chi2n",
"35": "Chi2v",
"36": "Chi3n",
"37": "Chi3v",
"38": "Chi4n",
"39": "Chi4v",
"40": "HallKierAlpha",
"41": "Kappa1",
"42": "Kappa2",
"43": "Kappa3",
"44": "LabuteASA",
"45": "PEOE_VSA1",
"46": "PEOE_VSA10",
"47": "PEOE_VSA11",
"48": "PEOE_VSA12",
"49": "PEOE_VSA13",
"50": "PEOE_VSA14",
"51": "PEOE_VSA2",
"52": "PEOE_VSA3",
"53": "PEOE_VSA4",
"54": "PEOE_VSA5",
"55": "PEOE_VSA6",
"56": "PEOE_VSA7",
"57": "PEOE_VSA8",
"58": "PEOE_VSA9",
"59": "SMR_VSA1",
"60": "SMR_VSA10",
"61": "SMR_VSA2",
"62": "SMR_VSA3",
"63": "SMR_VSA4",
"64": "SMR_VSA5",
"65": "SMR_VSA6",
"66": "SMR_VSA7",
"67": "SMR_VSA9",
"68": "SlogP_VSA1",
"69": "SlogP_VSA10",
"70": "SlogP_VSA11",
"71": "SlogP_VSA12",
"72": "SlogP_VSA2",
"73": "SlogP_VSA3",
"74": "SlogP_VSA4",
"75": "SlogP_VSA5",
"76": "SlogP_VSA6",
"77": "SlogP_VSA7",
"78": "SlogP_VSA8",
"79": "TPSA",
"80": "EState_VSA1",
"81": "EState_VSA10",
"82": "EState_VSA11",
"83": "EState_VSA2",
"84": "EState_VSA3",
"85": "EState_VSA4",
"86": "EState_VSA5",
"87": "EState_VSA6",
"88": "EState_VSA7",
"89": "EState_VSA8",
"90": "EState_VSA9",
"91": "VSA_EState1",
"92": "VSA_EState10",
"93": "VSA_EState2",
"94": "VSA_EState3",
"95": "VSA_EState4",
"96": "VSA_EState5",
"97": "VSA_EState6",
"98": "VSA_EState7",
"99": "VSA_EState8",
"100": "VSA_EState9",
"101": "FractionCSP3",
"102": "HeavyAtomCount",
"103": "NHOHCount",
"104": "NOCount",
"105": "NumAliphaticCarbocycles",
"106": "NumAliphaticHeterocycles",
"107": "NumAliphaticRings",
"108": "NumAmideBonds",
"109": "NumAromaticCarbocycles",
"110": "NumAromaticHeterocycles",
"111": "NumAromaticRings",
"112": "NumAtomStereoCenters",
"113": "NumBridgeheadAtoms",
"114": "NumHAcceptors",
"115": "NumHDonors",
"116": "NumHeteroatoms",
"117": "NumHeterocycles",
"118": "NumRotatableBonds",
"119": "NumSaturatedCarbocycles",
"120": "NumSaturatedHeterocycles",
"121": "NumSaturatedRings",
"122": "NumSpiroAtoms",
"123": "NumUnspecifiedAtomStereoCenters",
"124": "Phi",
"125": "RingCount",
"126": "MolLogP",
"127": "MolMR",
"128": "fr_Al_COO",
"129": "fr_Al_OH",
"130": "fr_Al_OH_noTert",
"131": "fr_ArN",
"132": "fr_Ar_COO",
"133": "fr_Ar_N",
"134": "fr_Ar_NH",
"135": "fr_Ar_OH",
"136": "fr_COO",
"137": "fr_COO2",
"138": "fr_C_O",
"139": "fr_C_O_noCOO",
"140": "fr_C_S",
"141": "fr_HOCCN",
"142": "fr_Imine",
"143": "fr_NH0",
"144": "fr_NH1",
"145": "fr_NH2",
"146": "fr_N_O",
"147": "fr_Ndealkylation1",
"148": "fr_Ndealkylation2",
"149": "fr_Nhpyrrole",
"150": "fr_SH",
"151": "fr_aldehyde",
"152": "fr_alkyl_carbamate",
"153": "fr_alkyl_halide",
"154": "fr_allylic_oxid",
"155": "fr_amide",
"156": "fr_amidine",
"157": "fr_aniline",
"158": "fr_aryl_methyl",
"159": "fr_azide",
"160": "fr_azo",
"161": "fr_barbitur",
"162": "fr_benzene",
"163": "fr_benzodiazepine",
"164": "fr_bicyclic",
"165": "fr_dihydropyridine",
"166": "fr_epoxide",
"167": "fr_ester",
"168": "fr_ether",
"169": "fr_furan",
"170": "fr_guanido",
"171": "fr_halogen",
"172": "fr_hdrzine",
"173": "fr_hdrzone",
"174": "fr_imidazole",
"175": "fr_imide",
"176": "fr_ketone",
"177": "fr_ketone_Topliss",
"178": "fr_lactam",
"179": "fr_lactone",
"180": "fr_methoxy",
"181": "fr_morpholine",
"182": "fr_nitrile",
"183": "fr_nitro",
"184": "fr_nitro_arom",
"185": "fr_nitro_arom_nonortho",
"186": "fr_oxazole",
"187": "fr_oxime",
"188": "fr_para_hydroxylation",
"189": "fr_phenol",
"190": "fr_phenol_noOrthoHbond",
"191": "fr_phos_acid",
"192": "fr_phos_ester",
"193": "fr_piperdine",
"194": "fr_piperzine",
"195": "fr_priamide",
"196": "fr_pyridine",
"197": "fr_quatN",
"198": "fr_sulfide",
"199": "fr_sulfonamd",
"200": "fr_sulfone",
"201": "fr_term_acetylene",
"202": "fr_tetrazole",
"203": "fr_thiazole",
"204": "fr_thiophene",
"205": "fr_unbrch_alkane",
"206": "fr_urea"
},
"initializer_cutoff_factor": 2.0,
"initializer_range": 0.02,
"intermediate_size": 1152,
"label2id": {
"AvgIpc": 25,
"BCUT2D_CHGHI": 19,
"BCUT2D_CHGLO": 20,
"BCUT2D_LOGPHI": 21,
"BCUT2D_LOGPLOW": 22,
"BCUT2D_MRHI": 23,
"BCUT2D_MRLOW": 24,
"BCUT2D_MWHI": 17,
"BCUT2D_MWLOW": 18,
"BalabanJ": 26,
"BertzCT": 27,
"Chi0": 28,
"Chi0n": 29,
"Chi0v": 30,
"Chi1": 31,
"Chi1n": 32,
"Chi1v": 33,
"Chi2n": 34,
"Chi2v": 35,
"Chi3n": 36,
"Chi3v": 37,
"Chi4n": 38,
"Chi4v": 39,
"EState_VSA1": 80,
"EState_VSA10": 81,
"EState_VSA11": 82,
"EState_VSA2": 83,
"EState_VSA3": 84,
"EState_VSA4": 85,
"EState_VSA5": 86,
"EState_VSA6": 87,
"EState_VSA7": 88,
"EState_VSA8": 89,
"EState_VSA9": 90,
"ExactMolWt": 8,
"FpDensityMorgan1": 14,
"FpDensityMorgan2": 15,
"FpDensityMorgan3": 16,
"FractionCSP3": 101,
"HallKierAlpha": 40,
"HeavyAtomCount": 102,
"HeavyAtomMolWt": 7,
"Kappa1": 41,
"Kappa2": 42,
"Kappa3": 43,
"LabuteASA": 44,
"MaxAbsEStateIndex": 0,
"MaxAbsPartialCharge": 12,
"MaxEStateIndex": 1,
"MaxPartialCharge": 10,
"MinAbsEStateIndex": 2,
"MinAbsPartialCharge": 13,
"MinEStateIndex": 3,
"MinPartialCharge": 11,
"MolLogP": 126,
"MolMR": 127,
"MolWt": 6,
"NHOHCount": 103,
"NOCount": 104,
"NumAliphaticCarbocycles": 105,
"NumAliphaticHeterocycles": 106,
"NumAliphaticRings": 107,
"NumAmideBonds": 108,
"NumAromaticCarbocycles": 109,
"NumAromaticHeterocycles": 110,
"NumAromaticRings": 111,
"NumAtomStereoCenters": 112,
"NumBridgeheadAtoms": 113,
"NumHAcceptors": 114,
"NumHDonors": 115,
"NumHeteroatoms": 116,
"NumHeterocycles": 117,
"NumRotatableBonds": 118,
"NumSaturatedCarbocycles": 119,
"NumSaturatedHeterocycles": 120,
"NumSaturatedRings": 121,
"NumSpiroAtoms": 122,
"NumUnspecifiedAtomStereoCenters": 123,
"NumValenceElectrons": 9,
"PEOE_VSA1": 45,
"PEOE_VSA10": 46,
"PEOE_VSA11": 47,
"PEOE_VSA12": 48,
"PEOE_VSA13": 49,
"PEOE_VSA14": 50,
"PEOE_VSA2": 51,
"PEOE_VSA3": 52,
"PEOE_VSA4": 53,
"PEOE_VSA5": 54,
"PEOE_VSA6": 55,
"PEOE_VSA7": 56,
"PEOE_VSA8": 57,
"PEOE_VSA9": 58,
"Phi": 124,
"RingCount": 125,
"SMR_VSA1": 59,
"SMR_VSA10": 60,
"SMR_VSA2": 61,
"SMR_VSA3": 62,
"SMR_VSA4": 63,
"SMR_VSA5": 64,
"SMR_VSA6": 65,
"SMR_VSA7": 66,
"SMR_VSA9": 67,
"SPS": 5,
"SlogP_VSA1": 68,
"SlogP_VSA10": 69,
"SlogP_VSA11": 70,
"SlogP_VSA12": 71,
"SlogP_VSA2": 72,
"SlogP_VSA3": 73,
"SlogP_VSA4": 74,
"SlogP_VSA5": 75,
"SlogP_VSA6": 76,
"SlogP_VSA7": 77,
"SlogP_VSA8": 78,
"TPSA": 79,
"VSA_EState1": 91,
"VSA_EState10": 92,
"VSA_EState2": 93,
"VSA_EState3": 94,
"VSA_EState4": 95,
"VSA_EState5": 96,
"VSA_EState6": 97,
"VSA_EState7": 98,
"VSA_EState8": 99,
"VSA_EState9": 100,
"fr_Al_COO": 128,
"fr_Al_OH": 129,
"fr_Al_OH_noTert": 130,
"fr_ArN": 131,
"fr_Ar_COO": 132,
"fr_Ar_N": 133,
"fr_Ar_NH": 134,
"fr_Ar_OH": 135,
"fr_COO": 136,
"fr_COO2": 137,
"fr_C_O": 138,
"fr_C_O_noCOO": 139,
"fr_C_S": 140,
"fr_HOCCN": 141,
"fr_Imine": 142,
"fr_NH0": 143,
"fr_NH1": 144,
"fr_NH2": 145,
"fr_N_O": 146,
"fr_Ndealkylation1": 147,
"fr_Ndealkylation2": 148,
"fr_Nhpyrrole": 149,
"fr_SH": 150,
"fr_aldehyde": 151,
"fr_alkyl_carbamate": 152,
"fr_alkyl_halide": 153,
"fr_allylic_oxid": 154,
"fr_amide": 155,
"fr_amidine": 156,
"fr_aniline": 157,
"fr_aryl_methyl": 158,
"fr_azide": 159,
"fr_azo": 160,
"fr_barbitur": 161,
"fr_benzene": 162,
"fr_benzodiazepine": 163,
"fr_bicyclic": 164,
"fr_dihydropyridine": 165,
"fr_epoxide": 166,
"fr_ester": 167,
"fr_ether": 168,
"fr_furan": 169,
"fr_guanido": 170,
"fr_halogen": 171,
"fr_hdrzine": 172,
"fr_hdrzone": 173,
"fr_imidazole": 174,
"fr_imide": 175,
"fr_ketone": 176,
"fr_ketone_Topliss": 177,
"fr_lactam": 178,
"fr_lactone": 179,
"fr_methoxy": 180,
"fr_morpholine": 181,
"fr_nitrile": 182,
"fr_nitro": 183,
"fr_nitro_arom": 184,
"fr_nitro_arom_nonortho": 185,
"fr_oxazole": 186,
"fr_oxime": 187,
"fr_para_hydroxylation": 188,
"fr_phenol": 189,
"fr_phenol_noOrthoHbond": 190,
"fr_phos_acid": 191,
"fr_phos_ester": 192,
"fr_piperdine": 193,
"fr_piperzine": 194,
"fr_priamide": 195,
"fr_pyridine": 196,
"fr_quatN": 197,
"fr_sulfide": 198,
"fr_sulfonamd": 199,
"fr_sulfone": 200,
"fr_term_acetylene": 201,
"fr_tetrazole": 202,
"fr_thiazole": 203,
"fr_thiophene": 204,
"fr_unbrch_alkane": 205,
"fr_urea": 206,
"qed": 4
},
"layer_norm_eps": 1e-05,
"local_attention": 8,
"local_rope_theta": 10000.0,
"max_position_embeddings": 256,
"mlp_bias": false,
"mlp_dropout": 0.1,
"model_type": "modchembert",
"norm_bias": false,
"norm_eps": 1e-05,
"num_attention_heads": 12,
"num_hidden_layers": 22,
"num_labels": 207,
"pad_token_id": 2,
"position_embedding_type": "absolute",
"problem_type": "regression",
"repad_logits_with_grad": false,
"sep_token_id": 1,
"sparse_pred_ignore_index": -100,
"sparse_prediction": false,
"transformers_version": "4.56.1",
"vocab_size": 2362
}