rozariwang committed on
Commit
10aa356
·
verified ·
1 Parent(s): 759dc29

Upload 4 files

Browse files
Files changed (4) hide show
  1. config.json +16 -0
  2. model.safetensors +3 -0
  3. pytorch_model.bin +3 -0
  4. vocab.json +0 -0
config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "d_model": 512,
3
+ "d_intermediate": 2048,
4
+ "n_layer": 12,
5
+ "vocab_size": 7924,
6
+ "ssm_cfg": {
7
+ "layer": "Mamba2"
8
+ },
9
+ "attn_layer_idx": [],
10
+ "attn_cfg": {},
11
+ "rms_norm": true,
12
+ "residual_in_fp32": true,
13
+ "fused_add_norm": true,
14
+ "pad_vocab_size_multiple": 8,
15
+ "tie_embeddings": true
16
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f1c202f071178d2740975322b9c084ebaba7364107511a4d066bf30b2294373
3
+ size 266076579
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45517b89a1aee212e1d861dc5a3c0d158a903c9920a3af9b18fcdb38ab667c1c
3
+ size 249879058
vocab.json ADDED
The diff for this file is too large to render. See raw diff