broadfield-dev's picture
Duplicate from broadfield-dev/savant_2_gsm8k_final
07aa2fb verified
raw
history blame contribute delete
461 Bytes
{
    "repo_id": "broadfield-dev/savant_2_gsm8k_final",
    "resume_from_benchmark": "",
    "benchmark_name_prefix": "stable-run",
    "benchmark_interval": 20,
    "sft_epochs": 4,
    "sft_lr": 2e-05,
    "sft_warmup_proportion": 0.1,
    "rl_lr": 1.5e-06,
    "sft_slice": "0:2000",
    "rl_slice": "4000:7473",
    "context_length": 1024,
    "base_model_name": "distilgpt2",
    "use_scheduler": true,
    "sft_batch_size": 1,
    "grad_accum_steps": 16
}