{ "timestamp": "2026-03-08T08:45:18.769911", "command_line_args": { "base_model": "Qwen/Qwen3-4B-Base", "ft_model": "/work8/yizhanh/0444_global_step_285_hf", "save_path": "/work8/yizhanh/mhm/MergeBench/math_rl", "task_name": "math", "sparsity": 0.1, "sigmoid_bias": 3.0, "lr": 100000000.0, "n_epochs": 1, "l1_strength": 0.0, "gpu_id": 5, "sample_size": 100 }, "actual_results": { "actual_sparsity": 0.1026563279741487, "target_sparsity": 0.1, "mask_proportion": 0.1026563279741487, "dataset_size": 100 }, "task_similarity": { "masked_energy_ratio": 0.9903082846604907, "cosine_similarity_in_mask_region": -2.3204116587294266e-05, "mask_coverage_ratio": 0.1026563279741487, "task_vector_l2_norm": 1.0, "masked_l2_norm": 0.9903082847595215, "unmasked_l2_norm": 0.43302464485168457 }, "graft_args": { "sparsity": 0.1, "sigmoid_bias": 3.0, "lr": 100000000.0, "num_train_epochs": 1, "l1_strength": 0.0 }, "task_similarity_between_models": { "jaccard_similarity": 0.369397455060345, "intersection_size": 306181056, "union_size": 828866176, "mask_1_size": 373003008, "mask_2_size": 762044288, "intersection_ratio_mask1": 0.8208541202970674, "intersection_ratio_mask2": 0.4017890571735379, "avg_intersection_ratio": 0.6113215887353026 } }