TerenceLau
/

sparrow

Model card Files Files and versions

TerenceLau committed on Feb 9, 2025

Commit

ae79607

·

verified ·

1 Parent(s): c978865

Upload model

Files changed (2) hide show

config.json +3 -5
pytorch_model.bin +1 -1

config.json CHANGED Viewed

@@ -1,11 +1,9 @@
 {
   "architectures": [
-    "SparrowModel"
   ],
   "attention_bias": false,
-  "auto_map": {
-    "AutoConfig": "modelling_sparrow.SparrowConfig"
-  },
   "dropout": 0.0,
   "flash_attn": true,
   "hidden_dim": 512,
@@ -14,7 +12,7 @@
   "max_seq_len": 512,
   "mlp_bias": false,
   "model_type": "sparrow",
-  "norm_eps": 1e-05,
   "num_attention_heads": 16,
   "num_hidden_layers": 8,
   "num_key_value_heads": 16,

 {
+  "_name_or_path": "/data/sparrow/model/pretrain/",
   "architectures": [
+    "SparrowModelForCausalLM"
   ],
   "attention_bias": false,
   "dropout": 0.0,
   "flash_attn": true,
   "hidden_dim": 512,
   "max_seq_len": 512,
   "mlp_bias": false,
   "model_type": "sparrow",
+  "norm_eps": "1e-5",
   "num_attention_heads": 16,
   "num_hidden_layers": 8,
   "num_key_value_heads": 16,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:177c43fde459c6e4f610c58e282c98b8563f387f0db5bb1db3495948206cc82e
 size 204011452

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f24f36c610a73c1b64408eef0ca529c4a87e8461cf17446e276eb2ee26b8ebc
 size 204011452