Synthyra
/

DPLM2-3B

@@ -1,20 +1,21 @@
 {
-  "_name_or_path": "airkingbd/dplm_3b",
   "aa_type": 1,
   "architectures": [
     "DPLM2ForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.0,
   "attn_backend": "sdpa",
   "auto_map": {
-    "AutoConfig": "dplm2.DPLM2Config",
-    "AutoModel": "dplm2.DPLM2Model",
-    "AutoModelForMaskedLM": "dplm2.DPLM2ForMaskedLM",
-    "AutoModelForSequenceClassification": "dplm2.DPLM2ForSequenceClassification",
-    "AutoModelForTokenClassification": "dplm2.DPLM2ForTokenClassification"
   },
   "classifier_dropout": null,
   "dplm_type": "dplm_esm",
   "emb_layer_norm_before": false,
   "esmfold_config": null,
   "hidden_act": "gelu",
@@ -22,6 +23,7 @@
   "hidden_size": 2560,
   "initializer_range": 0.02,
   "intermediate_size": 10240,
   "is_folding_model": false,
   "layer_norm_eps": 1e-05,
   "mask_token_id": 32,
@@ -35,8 +37,7 @@
   "struct_type": 0,
   "tie_word_embeddings": false,
   "token_dropout": true,
-  "torch_dtype": "float32",
-  "transformers_version": "4.48.1",
   "use_cache": true,
   "vocab_list": null,
   "vocab_size": 8229

 {
   "aa_type": 1,
+  "add_cross_attention": false,
   "architectures": [
     "DPLM2ForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.0,
   "attn_backend": "sdpa",
   "auto_map": {
+    "AutoConfig": "modeling_dplm2.DPLM2Config",
+    "AutoModel": "modeling_dplm2.DPLM2Model",
+    "AutoModelForMaskedLM": "modeling_dplm2.DPLM2ForMaskedLM",
+    "AutoModelForSequenceClassification": "modeling_dplm2.DPLM2ForSequenceClassification",
+    "AutoModelForTokenClassification": "modeling_dplm2.DPLM2ForTokenClassification"
   },
   "classifier_dropout": null,
   "dplm_type": "dplm_esm",
+  "dtype": "float32",
   "emb_layer_norm_before": false,
   "esmfold_config": null,
   "hidden_act": "gelu",
   "hidden_size": 2560,
   "initializer_range": 0.02,
   "intermediate_size": 10240,
+  "is_decoder": false,
   "is_folding_model": false,
   "layer_norm_eps": 1e-05,
   "mask_token_id": 32,
   "struct_type": 0,
   "tie_word_embeddings": false,
   "token_dropout": true,
+  "transformers_version": "5.2.0",
   "use_cache": true,
   "vocab_list": null,
   "vocab_size": 8229

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:77767a93408a01e8485ae27b008712aa8dbd6fa4221f97879a2703d45489e9be
+size 11524320476