File size: 461 Bytes
07aa2fb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
{
    "repo_id": "broadfield-dev/savant_2_gsm8k_final",
    "resume_from_benchmark": "",
    "benchmark_name_prefix": "stable-run",
    "benchmark_interval": 20,
    "sft_epochs": 4,
    "sft_lr": 2e-05,
    "sft_warmup_proportion": 0.1,
    "rl_lr": 1.5e-06,
    "sft_slice": "0:2000",
    "rl_slice": "4000:7473",
    "context_length": 1024,
    "base_model_name": "distilgpt2",
    "use_scheduler": true,
    "sft_batch_size": 1,
    "grad_accum_steps": 16
}