xiaohy committed on
Commit
6c351a4
·
verified ·
1 Parent(s): 0c40d4d

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +40 -0
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "Qwen/Qwen2.5-Math-1.5B-Instruct",
3
+ "lora_r": 8,
4
+ "lora_alpha": 16,
5
+ "lora_dropout": 0.05,
6
+ "target_modules": [
7
+ "q_proj",
8
+ "k_proj",
9
+ "v_proj",
10
+ "o_proj"
11
+ ],
12
+ "num_train_epochs": 10,
13
+ "per_device_train_batch_size": 2,
14
+ "gradient_accumulation_steps": 8,
15
+ "learning_rate": 0.0002,
16
+ "lr_scheduler_type": "cosine",
17
+ "warmup_ratio": 0.05,
18
+ "weight_decay": 0.01,
19
+ "fp16": true,
20
+ "max_seq_length": 512,
21
+ "label_smoothing_configs": [
22
+ 0.0,
23
+ 0.02,
24
+ 0.05,
25
+ 0.1,
26
+ 0.2
27
+ ],
28
+ "perturbation_sigmas": [
29
+ 0.005,
30
+ 0.01,
31
+ 0.015,
32
+ 0.02,
33
+ 0.025,
34
+ 0.03
35
+ ],
36
+ "data_seed": 42,
37
+ "data_size": 2000,
38
+ "eval_questions": 300,
39
+ "created_at": "2026-03-11 17:52:45"
40
+ }