File size: 475 Bytes
7b5db6e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
{
  "base_model": "/root/affine-cortex/models",
  "output_dir": "./trained_model",
  "lora_r": 32,
  "lora_alpha": 64,
  "lora_dropout": 0.05,
  "stage1_epochs": 1,
  "stage1_lr": 0.0002,
  "stage1_batch_size": 2,
  "stage1_grad_accum": 8,
  "stage2_epochs": 1,
  "stage2_lr": 0.0001,
  "stage2_batch_size": 2,
  "stage2_grad_accum": 8,
  "max_length": 8192,
  "warmup_ratio": 0.03,
  "weight_decay": 0.01,
  "max_grad_norm": 1.0,
  "save_steps": 500,
  "logging_steps": 10
}