yotsubian committed on
Commit
ed59074
·
verified ·
1 Parent(s): b196674

Upload config_exp1.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config_exp1.yaml +40 -0
config_exp1.yaml ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:  # Base model section. NOTE(review): this diff view lost indentation; the keys below presumably nest under `model`.
2
+ name: "Qwen/Qwen3-4B-Instruct-2507"  # looks like a Hugging Face Hub repo id (org/name) - confirm against the loader
3
+ torch_dtype: "bfloat16"  # dtype given as a string; presumably mapped to a torch dtype by the consumer - confirm
4
+ trust_remote_code: false  # real boolean, disabled
5
+
6
+ lora:  # LoRA adapter section. NOTE(review): key names resemble PEFT's LoraConfig fields - confirm that is the consumer.
7
+ r: 16  # presumably the adapter rank - confirm
8
+ lora_alpha: 32  # exactly 2 x r as configured here
9
+ target_modules: ["q_proj", "v_proj", "k_proj", "o_proj"]  # four module names; presumably the attention projections - confirm against the model
10
+ lora_dropout: 0.05
11
+ bias: "none"  # the string "none", not a YAML null
12
+
13
+ training:  # Fine-tuning run section. NOTE(review): this diff view lost indentation; the keys below presumably nest under `training`.
14
+ num_epochs: 3
15
+ per_device_batch_size: 2
16
+ gradient_accumulation_steps: 3  # with batch size 2 this would give 2 x 3 = 6 samples per optimizer step per device, assuming the usual multiplication - confirm
17
+ learning_rate: 0.0002  # i.e. 2e-4, written in plain decimal form
18
+ lr_scheduler: "cosine"
19
+ warmup_ratio: 0.05  # presumably a fraction of total training steps - confirm
20
+ bf16: true  # matches the "bfloat16" torch_dtype in the model section
21
+ gradient_checkpointing: false
22
+ logging_steps: 20
23
+ save_strategy: "epoch"
24
+ save_total_limit: 3  # same value as num_epochs, so presumably no epoch checkpoint is pruned - confirm
25
+ max_length: 1024  # unit not stated here; presumably tokens - confirm
26
+
27
+ generation:  # Sampling section. NOTE(review): this diff view lost indentation; the keys below presumably nest under `generation`.
28
+ max_new_tokens: 512
29
+ temperature: 1.0
30
+ n_samples: 32  # presumably the number of samples drawn per prompt - confirm
31
+
32
+ paths:  # Directory locations; all three are relative paths with a trailing slash.
33
+ checkpoint_dir: "checkpoints/"  # NOTE(review): relative - which base directory it resolves against is not shown here
34
+ results_dir: "results/"
35
+ data_dir: "data/"
36
+
37
+ lean_server:  # Connection section for a service named "lean_server"; what the service does is not shown here.
38
+ url: "http://localhost:8000"  # plain HTTP on the local machine, port 8000
39
+ timeout: 60  # unit not stated here; presumably seconds - confirm
40
+ max_workers: 32  # same value as generation n_samples (32); whether that is intentional is not shown - confirm