facebook/pe-av-base

Model card | Files and versions

Upload model

#5

by eustlb (HF Staff) - opened Jan 29

base: refs/heads/main ← from: refs/pr/5

Discussion Files changed

Files changed (2) hide show

config.json +9 -1
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -112,6 +112,7 @@
       "tie_word_embeddings": true,
       "tokenizer_class": null
     },
     "head_dim": 128,
     "hidden_act": "silu",
     "hidden_size": 1024,
@@ -1241,6 +1242,7 @@
   "text_config": {
     "attention_bias": false,
     "attention_dropout": 0.0,
     "classifier_activation": "gelu",
     "classifier_bias": false,
     "classifier_dropout": 0.0,
@@ -1248,7 +1250,9 @@
     "cls_token_id": 50281,
     "decoder_bias": true,
     "deterministic_flash_attn": false,
     "embedding_dropout": 0.0,
     "global_attn_every_n_layers": 3,
     "hidden_activation": "gelu",
     "hidden_size": 1024,
@@ -1288,6 +1292,7 @@
     "norm_eps": 1e-05,
     "num_attention_heads": 16,
     "num_hidden_layers": 22,
     "repad_logits_with_grad": false,
     "rope_parameters": {
       "full_attention": {
@@ -1299,9 +1304,12 @@
         "rope_type": "default"
       }
     },
     "sparse_pred_ignore_index": -100,
     "sparse_prediction": false,
     "vocab_size": 50368
   },
-  "transformers_version": "5.0.0.dev0"
 }

       "tie_word_embeddings": true,
       "tokenizer_class": null
     },
+    "dtype": "float32",
     "head_dim": 128,
     "hidden_act": "silu",
     "hidden_size": 1024,
   "text_config": {
     "attention_bias": false,
     "attention_dropout": 0.0,
+    "bos_token_id": 50281,
     "classifier_activation": "gelu",
     "classifier_bias": false,
     "classifier_dropout": 0.0,
     "cls_token_id": 50281,
     "decoder_bias": true,
     "deterministic_flash_attn": false,
+    "dtype": "float32",
     "embedding_dropout": 0.0,
+    "eos_token_id": 50282,
     "global_attn_every_n_layers": 3,
     "hidden_activation": "gelu",
     "hidden_size": 1024,
     "norm_eps": 1e-05,
     "num_attention_heads": 16,
     "num_hidden_layers": 22,
+    "pad_token_id": 50283,
     "repad_logits_with_grad": false,
     "rope_parameters": {
       "full_attention": {
         "rope_type": "default"
       }
     },
+    "sep_token_id": 50282,
     "sparse_pred_ignore_index": -100,
     "sparse_prediction": false,
+    "tie_word_embeddings": true,
     "vocab_size": 50368
   },
+  "tie_word_embeddings": true,
+  "transformers_version": "5.0.1.dev0"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa8046961d09730df10c0c2707565c9610a671643a6a064c42985aa26b2dbcd3
-size 9162993936

 version https://git-lfs.github.com/spec/v1
+oid sha256:c87718fb93e00f3b2e5c886b3a6a589ee3bc3d29ea0c1a2e1f6b1e141c19170e
+size 4134930120