montalte_code_think_dataavailable_ls / localize_stitch_single_info.json
modrill's picture
Add files using upload-large-folder tool
d92746e verified
{
"base_model": "Qwen/Qwen3-4B-Base",
"ft_model": "Montalte/code_think",
"task_name": "coding",
"sample_size": 64,
"effective_sample_size": 64,
"n_epochs": 10,
"sparsity": 0.1,
"sigmoid_bias": 3.0,
"lr": 10000000.0,
"l1_strength": 1e-05,
"max_length": 2048,
"dataless": false,
"mask_ratio": 0.10025214239450347,
"save_merged_model": true,
"algorithm": "repo_exact_localizer_train_mask"
}