Trinity-337B-W4A16 / dequant_verification.json
0xSero's picture
W4A16 RTN quantization (216/256 experts, 166GB)
8032f24 verified
{
"layers": [
{
"label": "dense_mlp_L0",
"layer": "model.layers.0.mlp.gate_proj",
"snr_db": 8.8,
"cosine": 0.942961,
"mae": 0.001491
},
{
"label": "dense_mlp_L2",
"layer": "model.layers.2.mlp.gate_proj",
"snr_db": 9.0,
"cosine": 0.946257,
"mae": 0.001487
},
{
"label": "dense_mlp_L5",
"layer": "model.layers.5.mlp.gate_proj",
"snr_db": 9.1,
"cosine": 0.946178,
"mae": 0.001739
},
{
"label": "moe_L6_E0",
"layer": "model.layers.6.mlp.experts.0.gate_proj",
"snr_db": 8.6,
"cosine": 0.936454,
"mae": 0.001716
},
{
"label": "moe_L6_E100",
"layer": "model.layers.6.mlp.experts.100.gate_proj",
"snr_db": 8.6,
"cosine": 0.936431,
"mae": 0.001703
},
{
"label": "moe_L30_E0",
"layer": "model.layers.30.mlp.experts.0.gate_proj",
"snr_db": 8.6,
"cosine": 0.936316,
"mae": 0.001769
},
{
"label": "moe_L30_E100",
"layer": "model.layers.30.mlp.experts.100.gate_proj",
"snr_db": 8.6,
"cosine": 0.93641,
"mae": 0.001734
},
{
"label": "moe_L59_E0",
"layer": "model.layers.59.mlp.experts.0.gate_proj",
"snr_db": 8.6,
"cosine": 0.936509,
"mae": 0.001727
},
{
"label": "moe_L59_E100",
"layer": "model.layers.59.mlp.experts.100.gate_proj",
"snr_db": 8.6,
"cosine": 0.936509,
"mae": 0.001688
}
],
"avg_snr_db": 8.7,
"avg_cosine": 0.9393
}