jacobcd52 committed on
Commit
768506b
·
verified ·
1 Parent(s): 7dbdd1f

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +30 -0
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_config": {
3
+ "n_layer": 4,
4
+ "d_model": 512,
5
+ "n_ctx": 512,
6
+ "d_head": 16,
7
+ "d_mlp": 2048,
8
+ "vocab_size": 4096,
9
+ "use_rms_norm": true,
10
+ "tie_embeddings": false,
11
+ "use_positional_embeddings": false,
12
+ "use_bigram_table": false,
13
+ "use_attention_sinks": true,
14
+ "activation": "gelu",
15
+ "dropout": 0.0,
16
+ "use_bias": true
17
+ },
18
+ "sparsity_config": {
19
+ "enable_weight_sparsity": false,
20
+ "target_l0_fraction": 1,
21
+ "enable_activation_sparsity": false,
22
+ "activation_topk_fraction": 0.25
23
+ },
24
+ "training_config": {
25
+ "total_tokens": 2000000000,
26
+ "batch_size": 128,
27
+ "dataset_name": "SimpleStories/SimpleStories",
28
+ "tokenizer_name": "SimpleStories/SimpleStories-1.25M"
29
+ }
30
+ }