File size: 1,388 Bytes
3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 725a0e7 3ffbf41 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 | {
"timestamp": "2026-03-08T08:45:18.769911",
"command_line_args": {
"base_model": "Qwen/Qwen3-4B-Base",
"ft_model": "/work8/yizhanh/0444_global_step_285_hf",
"save_path": "/work8/yizhanh/mhm/MergeBench/math_rl",
"task_name": "math",
"sparsity": 0.1,
"sigmoid_bias": 3.0,
"lr": 100000000.0,
"n_epochs": 1,
"l1_strength": 0.0,
"gpu_id": 5,
"sample_size": 100
},
"actual_results": {
"actual_sparsity": 0.1026563279741487,
"target_sparsity": 0.1,
"mask_proportion": 0.1026563279741487,
"dataset_size": 100
},
"task_similarity": {
"masked_energy_ratio": 0.9903082846604907,
"cosine_similarity_in_mask_region": -2.3204116587294266e-05,
"mask_coverage_ratio": 0.1026563279741487,
"task_vector_l2_norm": 1.0,
"masked_l2_norm": 0.9903082847595215,
"unmasked_l2_norm": 0.43302464485168457
},
"graft_args": {
"sparsity": 0.1,
"sigmoid_bias": 3.0,
"lr": 100000000.0,
"num_train_epochs": 1,
"l1_strength": 0.0
},
"task_similarity_between_models": {
"jaccard_similarity": 0.369397455060345,
"intersection_size": 306181056,
"union_size": 828866176,
"mask_1_size": 373003008,
"mask_2_size": 762044288,
"intersection_ratio_mask1": 0.8208541202970674,
"intersection_ratio_mask2": 0.4017890571735379,
"avg_intersection_ratio": 0.6113215887353026
}
} |