montalte_math_think_dataavailable_ls / localize_stitch_single_info.json
modrill's picture
Add files using upload-large-folder tool
15bf728 verified
{
"base_model": "Qwen/Qwen3-4B-Base",
"ft_model": "Montalte/math_think",
"task_name": "math",
"sample_size": 64,
"effective_sample_size": 64,
"n_epochs": 10,
"sparsity": 0.1,
"sigmoid_bias": 3.0,
"lr": 10000000.0,
"l1_strength": 1e-05,
"max_length": 2048,
"dataless": false,
"mask_ratio": 0.10625616340344946,
"save_merged_model": true,
"algorithm": "repo_exact_localizer_train_mask"
}