aneeshm44's picture
Upload pruning_summary.json with huggingface_hub
7271828 verified
{
"source_model_path": "/data/aneesh/gpt_oss_120b",
"mapping_path": "/data/aneesh/aimo/pruning/mappings/expert_mapping_120b_mxfp4_new_large.json",
"save_path": "models/threshold_99",
"threshold": 99.0,
"num_layers": 36,
"num_output_shards": 15,
"written_tensor_count": 687,
"pruned_tensor_count": 288,
"copied_tensor_count": 399,
"layer_stats": [
{
"layer": 0,
"total_experts": 128,
"needed": 120,
"pct_used": 93.75,
"never_used": 0
},
{
"layer": 1,
"total_experts": 128,
"needed": 116,
"pct_used": 90.625,
"never_used": 0
},
{
"layer": 2,
"total_experts": 128,
"needed": 111,
"pct_used": 86.71875,
"never_used": 0
},
{
"layer": 3,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 4,
"total_experts": 128,
"needed": 110,
"pct_used": 85.9375,
"never_used": 0
},
{
"layer": 5,
"total_experts": 128,
"needed": 114,
"pct_used": 89.0625,
"never_used": 0
},
{
"layer": 6,
"total_experts": 128,
"needed": 114,
"pct_used": 89.0625,
"never_used": 0
},
{
"layer": 7,
"total_experts": 128,
"needed": 110,
"pct_used": 85.9375,
"never_used": 0
},
{
"layer": 8,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 9,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 10,
"total_experts": 128,
"needed": 102,
"pct_used": 79.6875,
"never_used": 0
},
{
"layer": 11,
"total_experts": 128,
"needed": 93,
"pct_used": 72.65625,
"never_used": 0
},
{
"layer": 12,
"total_experts": 128,
"needed": 104,
"pct_used": 81.25,
"never_used": 0
},
{
"layer": 13,
"total_experts": 128,
"needed": 98,
"pct_used": 76.5625,
"never_used": 0
},
{
"layer": 14,
"total_experts": 128,
"needed": 107,
"pct_used": 83.59375,
"never_used": 0
},
{
"layer": 15,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 16,
"total_experts": 128,
"needed": 107,
"pct_used": 83.59375,
"never_used": 0
},
{
"layer": 17,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 18,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 19,
"total_experts": 128,
"needed": 107,
"pct_used": 83.59375,
"never_used": 0
},
{
"layer": 20,
"total_experts": 128,
"needed": 110,
"pct_used": 85.9375,
"never_used": 0
},
{
"layer": 21,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 22,
"total_experts": 128,
"needed": 112,
"pct_used": 87.5,
"never_used": 0
},
{
"layer": 23,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 24,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 25,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 26,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 27,
"total_experts": 128,
"needed": 109,
"pct_used": 85.15625,
"never_used": 0
},
{
"layer": 28,
"total_experts": 128,
"needed": 105,
"pct_used": 82.03125,
"never_used": 0
},
{
"layer": 29,
"total_experts": 128,
"needed": 108,
"pct_used": 84.375,
"never_used": 0
},
{
"layer": 30,
"total_experts": 128,
"needed": 111,
"pct_used": 86.71875,
"never_used": 0
},
{
"layer": 31,
"total_experts": 128,
"needed": 119,
"pct_used": 92.96875,
"never_used": 0
},
{
"layer": 32,
"total_experts": 128,
"needed": 110,
"pct_used": 85.9375,
"never_used": 0
},
{
"layer": 33,
"total_experts": 128,
"needed": 103,
"pct_used": 80.46875,
"never_used": 0
},
{
"layer": 34,
"total_experts": 128,
"needed": 103,
"pct_used": 80.46875,
"never_used": 0
},
{
"layer": 35,
"total_experts": 128,
"needed": 90,
"pct_used": 70.3125,
"never_used": 1
}
]
}