montalte_code_think_dataavailable_fullval_e1_ls / localize_stitch_single_info.json
modrill's picture
Add files using upload-large-folder tool
bb4a137 verified
{
"base_model": "Qwen/Qwen3-4B-Base",
"ft_model": "Montalte/code_think",
"task_name": "coding",
"sample_size": null,
"effective_sample_size": 1000,
"n_epochs": 1,
"sparsity": 0.1,
"sigmoid_bias": 3.0,
"lr": 100000000.0,
"l1_strength": 0.0,
"max_length": 2048,
"dataless": false,
"mask_ratio": 0.10003264676216547,
"save_merged_model": true,
"algorithm": "repo_exact_localizer_train_mask"
}