Synthyra
/

DPLM2-650M

Model card Files Files and versions

lhallee committed on Feb 19

Commit

d753c1f

·

verified ·

1 Parent(s): 7566dce

Upload DPLM2ForMaskedLM

Files changed (2) hide show

config.json +9 -8
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -1,20 +1,21 @@
 {
-  "_name_or_path": "facebook/esm2_t33_650M_UR50D",
   "aa_type": 1,
   "architectures": [
     "DPLM2ForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.0,
   "attn_backend": "sdpa",
   "auto_map": {
-    "AutoConfig": "dplm2.DPLM2Config",
-    "AutoModel": "dplm2.DPLM2Model",
-    "AutoModelForMaskedLM": "dplm2.DPLM2ForMaskedLM",
-    "AutoModelForSequenceClassification": "dplm2.DPLM2ForSequenceClassification",
-    "AutoModelForTokenClassification": "dplm2.DPLM2ForTokenClassification"
   },
   "classifier_dropout": null,
   "dplm_type": "dplm2_esm",
   "emb_layer_norm_before": false,
   "esmfold_config": null,
   "hidden_act": "gelu",
@@ -22,6 +23,7 @@
   "hidden_size": 1280,
   "initializer_range": 0.02,
   "intermediate_size": 5120,
   "is_folding_model": false,
   "layer_norm_eps": 1e-05,
   "mask_token_id": 32,
@@ -35,8 +37,7 @@
   "struct_type": 0,
   "tie_word_embeddings": false,
   "token_dropout": true,
-  "torch_dtype": "float32",
-  "transformers_version": "4.48.1",
   "use_cache": true,
   "vocab_list": null,
   "vocab_size": 8229

 {
   "aa_type": 1,
+  "add_cross_attention": false,
   "architectures": [
     "DPLM2ForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.0,
   "attn_backend": "sdpa",
   "auto_map": {
+    "AutoConfig": "modeling_dplm2.DPLM2Config",
+    "AutoModel": "modeling_dplm2.DPLM2Model",
+    "AutoModelForMaskedLM": "modeling_dplm2.DPLM2ForMaskedLM",
+    "AutoModelForSequenceClassification": "modeling_dplm2.DPLM2ForSequenceClassification",
+    "AutoModelForTokenClassification": "modeling_dplm2.DPLM2ForTokenClassification"
   },
   "classifier_dropout": null,
   "dplm_type": "dplm2_esm",
+  "dtype": "float32",
   "emb_layer_norm_before": false,
   "esmfold_config": null,
   "hidden_act": "gelu",
   "hidden_size": 1280,
   "initializer_range": 0.02,
   "intermediate_size": 5120,
+  "is_decoder": false,
   "is_folding_model": false,
   "layer_norm_eps": 1e-05,
   "mask_token_id": 32,
   "struct_type": 0,
   "tie_word_embeddings": false,
   "token_dropout": true,
+  "transformers_version": "5.2.0",
   "use_cache": true,
   "vocab_list": null,
   "vocab_size": 8229

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d0513a06dca00ad19004d9285803b99def257a6ba49d85aefd255def63a05c5
-size 2693624204

 version https://git-lfs.github.com/spec/v1
+oid sha256:92db08c7dbfd6c5e03fbfeaea3f36b09640ee794dcf5ea8d550527869a9f1d63
+size 2688370964