valcore committed on
Commit
3f81aab
·
verified ·
1 Parent(s): 7fd76e6

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +23 -0
config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "Qwen/Qwen3-0.6B",
3
+ "num_heads": 4,
4
+ "head_layer_indices": [
5
+ 5,
6
+ 11,
7
+ 16,
8
+ 22
9
+ ],
10
+ "quantization": "none",
11
+ "hidden_size": 1024,
12
+ "vocab_size": 151936,
13
+ "num_hidden_layers": 28,
14
+ "training_config": {
15
+ "dataset_name": "wikitext",
16
+ "dataset_config_name": "wikitext-2-raw-v1",
17
+ "batch_size": 4,
18
+ "gradient_accumulation_steps": 32,
19
+ "max_steps": 500,
20
+ "lr": 0.005,
21
+ "max_length": 512
22
+ }
23
+ }