Transformers
alplusplus committed on
Commit
7932211
·
verified ·
1 Parent(s): adfe8de

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +20 -0
config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "vocab_size": 50257,
3
+ "d_model": 512,
4
+ "n_layers": 8,
5
+ "n_heads": 8,
6
+ "d_latent": 128,
7
+ "n_bits": 3,
8
+ "d_rope": 16,
9
+ "fff_depth": 2,
10
+ "max_seq_len": 2048,
11
+ "batch_size": 8,
12
+ "lr": 0.0003,
13
+ "total_steps": 10000,
14
+ "warmup_steps": 500,
15
+ "grad_clip": 1.0,
16
+ "tokens_target": 100000000,
17
+ "log_every": 50,
18
+ "save_every": 1000,
19
+ "hf_repo": "alplusplus/maple-attn-test"
20
+ }