{
  "module": "keras_hub.src.models.esm.esm_masked_plm",
  "class_name": "ESMMaskedPLM",
  "config": {
    "backbone": {
      "module": "keras_hub.src.models.esm.esm_backbone",
      "class_name": "ESMBackbone",
      "config": {
        "name": "esm_backbone",
        "trainable": true,
        "vocabulary_size": 33,
        "num_layers": 33,
        "num_heads": 20,
        "hidden_dim": 1280,
        "intermediate_dim": 5120,
        "dropout": 0.0,
        "max_wavelength": 10000,
        "use_bias": true,
        "activation": "gelu",
        "layer_norm_eps": 1e-05,
        "use_pre_layer_norm": false,
        "position_embedding_type": "rotary",
        "max_sequence_length": 1026,
        "pad_token_id": 1
      },
      "registered_name": "keras_hub>ESMBackbone"
    },
    "preprocessor": {
      "module": "keras_hub.src.models.esm.esm_masked_plm_preprocessor",
      "class_name": "ESMMaskedPLMPreprocessor",
      "config": {
        "name": "esm_masked_plm_preprocessor_1",
        "trainable": true,
        "dtype": {
          "module": "keras",
          "class_name": "DTypePolicy",
          "config": {
            "name": "float32"
          },
          "registered_name": null
        },
        "tokenizer": {
          "module": "keras_hub.src.models.esm.esm_tokenizer",
          "class_name": "ESMTokenizer",
          "config": {
            "name": "esm_tokenizer",
            "trainable": true,
            "dtype": {
              "module": "keras",
              "class_name": "DTypePolicy",
              "config": {
                "name": "int32"
              },
              "registered_name": null
            },
            "config_file": "tokenizer.json",
            "vocabulary": null,
            "sequence_length": null,
            "lowercase": false,
            "strip_accents": false,
            "split": true,
            "suffix_indicator": "##",
            "oov_token": "<unk>",
            "special_tokens": null,
            "special_tokens_in_strings": false
          },
          "registered_name": "keras_hub>ESMTokenizer"
        },
        "config_file": "preprocessor.json",
        "sequence_length": 512,
        "truncate": "round_robin",
        "mask_selection_rate": 0.15,
        "mask_selection_length": 96,
        "mask_token_rate": 0.8,
        "random_token_rate": 0.1
      },
      "registered_name": "keras_hub>ESMMaskedPLMPreprocessor"
    },
    "name": "esm_masked_plm"
  },
  "registered_name": "keras_hub>ESMMaskedPLM"
}