Gemma-3-R1984-27B-EXL3 / measurement.json
Nekochu's picture
Add KLD measurement
9df4723 verified
{
"base": {
"dir": "D:\\main\\program\\AI\\CoridorGreenScreenMattingCPUfree\\tmp\\quants\\Gemma-3-R1984-27B-2.0bpw",
"bpw": 2.004435066344246
},
"alts": [
{
"dir": "D:\\main\\program\\AI\\CoridorGreenScreenMattingCPUfree\\tmp\\quants\\Gemma-3-R1984-27B-8.0bpw",
"bpw": 8.004435066344247
}
],
"groups": [
{
"idx": 0,
"layers": [
"language_model.model.layers.0.self_attn.q_proj",
"language_model.model.layers.0.self_attn.k_proj",
"language_model.model.layers.0.self_attn.v_proj",
"language_model.model.layers.0.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.006917499005794525,
"dbits": 396361728
}
]
},
{
"idx": 1,
"layers": [
"language_model.model.layers.0.mlp.gate_proj",
"language_model.model.layers.0.mlp.up_proj",
"language_model.model.layers.0.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.004495760053396247,
"dbits": 2080899072
}
]
},
{
"idx": 2,
"layers": [
"language_model.model.layers.1.self_attn.q_proj",
"language_model.model.layers.1.self_attn.k_proj",
"language_model.model.layers.1.self_attn.v_proj",
"language_model.model.layers.1.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0004842020571231842,
"dbits": 396361728
}
]
},
{
"idx": 3,
"layers": [
"language_model.model.layers.1.mlp.gate_proj",
"language_model.model.layers.1.mlp.up_proj",
"language_model.model.layers.1.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.005311993509531043,
"dbits": 2080899072
}
]
},
{
"idx": 4,
"layers": [
"language_model.model.layers.2.self_attn.q_proj",
"language_model.model.layers.2.self_attn.k_proj",
"language_model.model.layers.2.self_attn.v_proj",
"language_model.model.layers.2.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0011243283748627042,
"dbits": 396361728
}
]
},
{
"idx": 5,
"layers": [
"language_model.model.layers.2.mlp.gate_proj",
"language_model.model.layers.2.mlp.up_proj",
"language_model.model.layers.2.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.009011824429035198,
"dbits": 2080899072
}
]
},
{
"idx": 6,
"layers": [
"language_model.model.layers.3.self_attn.q_proj",
"language_model.model.layers.3.self_attn.k_proj",
"language_model.model.layers.3.self_attn.v_proj",
"language_model.model.layers.3.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.003413629531860307,
"dbits": 396361728
}
]
},
{
"idx": 7,
"layers": [
"language_model.model.layers.3.mlp.gate_proj",
"language_model.model.layers.3.mlp.up_proj",
"language_model.model.layers.3.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.006673009693622611,
"dbits": 2080899072
}
]
},
{
"idx": 8,
"layers": [
"language_model.model.layers.4.self_attn.q_proj",
"language_model.model.layers.4.self_attn.k_proj",
"language_model.model.layers.4.self_attn.v_proj",
"language_model.model.layers.4.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0005826622247695479,
"dbits": 396361728
}
]
},
{
"idx": 9,
"layers": [
"language_model.model.layers.4.mlp.gate_proj",
"language_model.model.layers.4.mlp.up_proj",
"language_model.model.layers.4.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0080329388380051,
"dbits": 2080899072
}
]
},
{
"idx": 10,
"layers": [
"language_model.model.layers.5.self_attn.q_proj",
"language_model.model.layers.5.self_attn.k_proj",
"language_model.model.layers.5.self_attn.v_proj",
"language_model.model.layers.5.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0023767203092575073,
"dbits": 396361728
}
]
},
{
"idx": 11,
"layers": [
"language_model.model.layers.5.mlp.gate_proj",
"language_model.model.layers.5.mlp.up_proj",
"language_model.model.layers.5.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.010135890543460868,
"dbits": 2080899072
}
]
},
{
"idx": 12,
"layers": [
"language_model.model.layers.6.self_attn.q_proj",
"language_model.model.layers.6.self_attn.k_proj",
"language_model.model.layers.6.self_attn.v_proj",
"language_model.model.layers.6.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0027037844061851835,
"dbits": 396361728
}
]
},
{
"idx": 13,
"layers": [
"language_model.model.layers.6.mlp.gate_proj",
"language_model.model.layers.6.mlp.up_proj",
"language_model.model.layers.6.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0041308201849460935,
"dbits": 2080899072
}
]
},
{
"idx": 14,
"layers": [
"language_model.model.layers.7.self_attn.q_proj",
"language_model.model.layers.7.self_attn.k_proj",
"language_model.model.layers.7.self_attn.v_proj",
"language_model.model.layers.7.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0014376796782016865,
"dbits": 396361728
}
]
},
{
"idx": 15,
"layers": [
"language_model.model.layers.7.mlp.gate_proj",
"language_model.model.layers.7.mlp.up_proj",
"language_model.model.layers.7.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.01197697520256047,
"dbits": 2080899072
}
]
},
{
"idx": 16,
"layers": [
"language_model.model.layers.8.self_attn.q_proj",
"language_model.model.layers.8.self_attn.k_proj",
"language_model.model.layers.8.self_attn.v_proj",
"language_model.model.layers.8.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0037170641124248394,
"dbits": 396361728
}
]
},
{
"idx": 17,
"layers": [
"language_model.model.layers.8.mlp.gate_proj",
"language_model.model.layers.8.mlp.up_proj",
"language_model.model.layers.8.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0004419878125190846,
"dbits": 2080899072
}
]
},
{
"idx": 18,
"layers": [
"language_model.model.layers.9.self_attn.q_proj",
"language_model.model.layers.9.self_attn.k_proj",
"language_model.model.layers.9.self_attn.v_proj",
"language_model.model.layers.9.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.004326772689819347,
"dbits": 396361728
}
]
},
{
"idx": 19,
"layers": [
"language_model.model.layers.9.mlp.gate_proj",
"language_model.model.layers.9.mlp.up_proj",
"language_model.model.layers.9.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.010839792340993915,
"dbits": 2080899072
}
]
},
{
"idx": 20,
"layers": [
"language_model.model.layers.10.self_attn.q_proj",
"language_model.model.layers.10.self_attn.k_proj",
"language_model.model.layers.10.self_attn.v_proj",
"language_model.model.layers.10.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.009040921181440398,
"dbits": 396361728
}
]
},
{
"idx": 21,
"layers": [
"language_model.model.layers.10.mlp.gate_proj",
"language_model.model.layers.10.mlp.up_proj",
"language_model.model.layers.10.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.031036542356014274,
"dbits": 2080899072
}
]
},
{
"idx": 22,
"layers": [
"language_model.model.layers.11.self_attn.q_proj",
"language_model.model.layers.11.self_attn.k_proj",
"language_model.model.layers.11.self_attn.v_proj",
"language_model.model.layers.11.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.00979023426771164,
"dbits": 396361728
}
]
},
{
"idx": 23,
"layers": [
"language_model.model.layers.11.mlp.gate_proj",
"language_model.model.layers.11.mlp.up_proj",
"language_model.model.layers.11.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.007736762613058112,
"dbits": 2080899072
}
]
},
{
"idx": 24,
"layers": [
"language_model.model.layers.12.self_attn.q_proj",
"language_model.model.layers.12.self_attn.k_proj",
"language_model.model.layers.12.self_attn.v_proj",
"language_model.model.layers.12.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.003069894015789054,
"dbits": 396361728
}
]
},
{
"idx": 25,
"layers": [
"language_model.model.layers.12.mlp.gate_proj",
"language_model.model.layers.12.mlp.up_proj",
"language_model.model.layers.12.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.014686931669712078,
"dbits": 2080899072
}
]
},
{
"idx": 26,
"layers": [
"language_model.model.layers.13.self_attn.q_proj",
"language_model.model.layers.13.self_attn.k_proj",
"language_model.model.layers.13.self_attn.v_proj",
"language_model.model.layers.13.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.000129348039627053,
"dbits": 396361728
}
]
},
{
"idx": 27,
"layers": [
"language_model.model.layers.13.mlp.gate_proj",
"language_model.model.layers.13.mlp.up_proj",
"language_model.model.layers.13.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003941317647695564,
"dbits": 2080899072
}
]
},
{
"idx": 28,
"layers": [
"language_model.model.layers.14.self_attn.q_proj",
"language_model.model.layers.14.self_attn.k_proj",
"language_model.model.layers.14.self_attn.v_proj",
"language_model.model.layers.14.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0035466991364956346,
"dbits": 396361728
}
]
},
{
"idx": 29,
"layers": [
"language_model.model.layers.14.mlp.gate_proj",
"language_model.model.layers.14.mlp.up_proj",
"language_model.model.layers.14.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.022119185328483615,
"dbits": 2080899072
}
]
},
{
"idx": 30,
"layers": [
"language_model.model.layers.15.self_attn.q_proj",
"language_model.model.layers.15.self_attn.k_proj",
"language_model.model.layers.15.self_attn.v_proj",
"language_model.model.layers.15.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.003810518234968141,
"dbits": 396361728
}
]
},
{
"idx": 31,
"layers": [
"language_model.model.layers.15.mlp.gate_proj",
"language_model.model.layers.15.mlp.up_proj",
"language_model.model.layers.15.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.009127749502658877,
"dbits": 2080899072
}
]
},
{
"idx": 32,
"layers": [
"language_model.model.layers.16.self_attn.q_proj",
"language_model.model.layers.16.self_attn.k_proj",
"language_model.model.layers.16.self_attn.v_proj",
"language_model.model.layers.16.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.006637018173933029,
"dbits": 396361728
}
]
},
{
"idx": 33,
"layers": [
"language_model.model.layers.16.mlp.gate_proj",
"language_model.model.layers.16.mlp.up_proj",
"language_model.model.layers.16.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.021292066574096713,
"dbits": 2080899072
}
]
},
{
"idx": 34,
"layers": [
"language_model.model.layers.17.self_attn.q_proj",
"language_model.model.layers.17.self_attn.k_proj",
"language_model.model.layers.17.self_attn.v_proj",
"language_model.model.layers.17.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0025063112378120866,
"dbits": 396361728
}
]
},
{
"idx": 35,
"layers": [
"language_model.model.layers.17.mlp.gate_proj",
"language_model.model.layers.17.mlp.up_proj",
"language_model.model.layers.17.mlp.down_proj"
],
"candidates": [
{
"dkld": 0.0022593840956687816,
"dbits": 2080899072
}
]
},
{
"idx": 36,
"layers": [
"language_model.model.layers.18.self_attn.q_proj",
"language_model.model.layers.18.self_attn.k_proj",
"language_model.model.layers.18.self_attn.v_proj",
"language_model.model.layers.18.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.002482272684574127,
"dbits": 396361728
}
]
},
{
"idx": 37,
"layers": [
"language_model.model.layers.18.mlp.gate_proj",
"language_model.model.layers.18.mlp.up_proj",
"language_model.model.layers.18.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.000394851714372646,
"dbits": 2080899072
}
]
},
{
"idx": 38,
"layers": [
"language_model.model.layers.19.self_attn.q_proj",
"language_model.model.layers.19.self_attn.k_proj",
"language_model.model.layers.19.self_attn.v_proj",
"language_model.model.layers.19.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0010013014078140703,
"dbits": 396361728
}
]
},
{
"idx": 39,
"layers": [
"language_model.model.layers.19.mlp.gate_proj",
"language_model.model.layers.19.mlp.up_proj",
"language_model.model.layers.19.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.020440497994422935,
"dbits": 2080899072
}
]
},
{
"idx": 40,
"layers": [
"language_model.model.layers.20.self_attn.q_proj",
"language_model.model.layers.20.self_attn.k_proj",
"language_model.model.layers.20.self_attn.v_proj",
"language_model.model.layers.20.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.004292172193527177,
"dbits": 396361728
}
]
},
{
"idx": 41,
"layers": [
"language_model.model.layers.20.mlp.gate_proj",
"language_model.model.layers.20.mlp.up_proj",
"language_model.model.layers.20.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0009037740528583527,
"dbits": 2080899072
}
]
},
{
"idx": 42,
"layers": [
"language_model.model.layers.21.self_attn.q_proj",
"language_model.model.layers.21.self_attn.k_proj",
"language_model.model.layers.21.self_attn.v_proj",
"language_model.model.layers.21.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.006902486085891724,
"dbits": 396361728
}
]
},
{
"idx": 43,
"layers": [
"language_model.model.layers.21.mlp.gate_proj",
"language_model.model.layers.21.mlp.up_proj",
"language_model.model.layers.21.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.00929136574268341,
"dbits": 2080899072
}
]
},
{
"idx": 44,
"layers": [
"language_model.model.layers.22.self_attn.q_proj",
"language_model.model.layers.22.self_attn.k_proj",
"language_model.model.layers.22.self_attn.v_proj",
"language_model.model.layers.22.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0036064453423023113,
"dbits": 396361728
}
]
},
{
"idx": 45,
"layers": [
"language_model.model.layers.22.mlp.gate_proj",
"language_model.model.layers.22.mlp.up_proj",
"language_model.model.layers.22.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0006043247878551594,
"dbits": 2080899072
}
]
},
{
"idx": 46,
"layers": [
"language_model.model.layers.23.self_attn.q_proj",
"language_model.model.layers.23.self_attn.k_proj",
"language_model.model.layers.23.self_attn.v_proj",
"language_model.model.layers.23.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.028081689029932022,
"dbits": 396361728
}
]
},
{
"idx": 47,
"layers": [
"language_model.model.layers.23.mlp.gate_proj",
"language_model.model.layers.23.mlp.up_proj",
"language_model.model.layers.23.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.00137981697916989,
"dbits": 2080899072
}
]
},
{
"idx": 48,
"layers": [
"language_model.model.layers.24.self_attn.q_proj",
"language_model.model.layers.24.self_attn.k_proj",
"language_model.model.layers.24.self_attn.v_proj",
"language_model.model.layers.24.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0014152429997921212,
"dbits": 396361728
}
]
},
{
"idx": 49,
"layers": [
"language_model.model.layers.24.mlp.gate_proj",
"language_model.model.layers.24.mlp.up_proj",
"language_model.model.layers.24.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.004900486022233974,
"dbits": 2080899072
}
]
},
{
"idx": 50,
"layers": [
"language_model.model.layers.25.self_attn.q_proj",
"language_model.model.layers.25.self_attn.k_proj",
"language_model.model.layers.25.self_attn.v_proj",
"language_model.model.layers.25.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.008432538062334072,
"dbits": 396361728
}
]
},
{
"idx": 51,
"layers": [
"language_model.model.layers.25.mlp.gate_proj",
"language_model.model.layers.25.mlp.up_proj",
"language_model.model.layers.25.mlp.down_proj"
],
"candidates": [
{
"dkld": 0.005563641339540459,
"dbits": 2080899072
}
]
},
{
"idx": 52,
"layers": [
"language_model.model.layers.26.self_attn.q_proj",
"language_model.model.layers.26.self_attn.k_proj",
"language_model.model.layers.26.self_attn.v_proj",
"language_model.model.layers.26.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.010603216290473949,
"dbits": 396361728
}
]
},
{
"idx": 53,
"layers": [
"language_model.model.layers.26.mlp.gate_proj",
"language_model.model.layers.26.mlp.up_proj",
"language_model.model.layers.26.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003027988225221656,
"dbits": 2080899072
}
]
},
{
"idx": 54,
"layers": [
"language_model.model.layers.27.self_attn.q_proj",
"language_model.model.layers.27.self_attn.k_proj",
"language_model.model.layers.27.self_attn.v_proj",
"language_model.model.layers.27.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.00233266279101374,
"dbits": 396361728
}
]
},
{
"idx": 55,
"layers": [
"language_model.model.layers.27.mlp.gate_proj",
"language_model.model.layers.27.mlp.up_proj",
"language_model.model.layers.27.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0059184454381466245,
"dbits": 2080899072
}
]
},
{
"idx": 56,
"layers": [
"language_model.model.layers.28.self_attn.q_proj",
"language_model.model.layers.28.self_attn.k_proj",
"language_model.model.layers.28.self_attn.v_proj",
"language_model.model.layers.28.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0004229128360748735,
"dbits": 396361728
}
]
},
{
"idx": 57,
"layers": [
"language_model.model.layers.28.mlp.gate_proj",
"language_model.model.layers.28.mlp.up_proj",
"language_model.model.layers.28.mlp.down_proj"
],
"candidates": [
{
"dkld": 0.007507449388504006,
"dbits": 2080899072
}
]
},
{
"idx": 58,
"layers": [
"language_model.model.layers.29.self_attn.q_proj",
"language_model.model.layers.29.self_attn.k_proj",
"language_model.model.layers.29.self_attn.v_proj",
"language_model.model.layers.29.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0012179315090179443,
"dbits": 396361728
}
]
},
{
"idx": 59,
"layers": [
"language_model.model.layers.29.mlp.gate_proj",
"language_model.model.layers.29.mlp.up_proj",
"language_model.model.layers.29.mlp.down_proj"
],
"candidates": [
{
"dkld": 0.007656254619359926,
"dbits": 2080899072
}
]
},
{
"idx": 60,
"layers": [
"language_model.model.layers.30.self_attn.q_proj",
"language_model.model.layers.30.self_attn.k_proj",
"language_model.model.layers.30.self_attn.v_proj",
"language_model.model.layers.30.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0006962120532989502,
"dbits": 396361728
}
]
},
{
"idx": 61,
"layers": [
"language_model.model.layers.30.mlp.gate_proj",
"language_model.model.layers.30.mlp.up_proj",
"language_model.model.layers.30.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0112728171050549,
"dbits": 2080899072
}
]
},
{
"idx": 62,
"layers": [
"language_model.model.layers.31.self_attn.q_proj",
"language_model.model.layers.31.self_attn.k_proj",
"language_model.model.layers.31.self_attn.v_proj",
"language_model.model.layers.31.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0017989106476307137,
"dbits": 396361728
}
]
},
{
"idx": 63,
"layers": [
"language_model.model.layers.31.mlp.gate_proj",
"language_model.model.layers.31.mlp.up_proj",
"language_model.model.layers.31.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0063770614564419015,
"dbits": 2080899072
}
]
},
{
"idx": 64,
"layers": [
"language_model.model.layers.32.self_attn.q_proj",
"language_model.model.layers.32.self_attn.k_proj",
"language_model.model.layers.32.self_attn.v_proj",
"language_model.model.layers.32.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.00029214099049568176,
"dbits": 396361728
}
]
},
{
"idx": 65,
"layers": [
"language_model.model.layers.32.mlp.gate_proj",
"language_model.model.layers.32.mlp.up_proj",
"language_model.model.layers.32.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.006251434981823012,
"dbits": 2080899072
}
]
},
{
"idx": 66,
"layers": [
"language_model.model.layers.33.self_attn.q_proj",
"language_model.model.layers.33.self_attn.k_proj",
"language_model.model.layers.33.self_attn.v_proj",
"language_model.model.layers.33.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0005352959036826754,
"dbits": 396361728
}
]
},
{
"idx": 67,
"layers": [
"language_model.model.layers.33.mlp.gate_proj",
"language_model.model.layers.33.mlp.up_proj",
"language_model.model.layers.33.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.005572766810655605,
"dbits": 2080899072
}
]
},
{
"idx": 68,
"layers": [
"language_model.model.layers.34.self_attn.q_proj",
"language_model.model.layers.34.self_attn.k_proj",
"language_model.model.layers.34.self_attn.v_proj",
"language_model.model.layers.34.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0008197985589504242,
"dbits": 396361728
}
]
},
{
"idx": 69,
"layers": [
"language_model.model.layers.34.mlp.gate_proj",
"language_model.model.layers.34.mlp.up_proj",
"language_model.model.layers.34.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.004082408547401439,
"dbits": 2080899072
}
]
},
{
"idx": 70,
"layers": [
"language_model.model.layers.35.self_attn.q_proj",
"language_model.model.layers.35.self_attn.k_proj",
"language_model.model.layers.35.self_attn.v_proj",
"language_model.model.layers.35.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0032249547541141066,
"dbits": 396361728
}
]
},
{
"idx": 71,
"layers": [
"language_model.model.layers.35.mlp.gate_proj",
"language_model.model.layers.35.mlp.up_proj",
"language_model.model.layers.35.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0070062801241874695,
"dbits": 2080899072
}
]
},
{
"idx": 72,
"layers": [
"language_model.model.layers.36.self_attn.q_proj",
"language_model.model.layers.36.self_attn.k_proj",
"language_model.model.layers.36.self_attn.v_proj",
"language_model.model.layers.36.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0005763806402683258,
"dbits": 396361728
}
]
},
{
"idx": 73,
"layers": [
"language_model.model.layers.36.mlp.gate_proj",
"language_model.model.layers.36.mlp.up_proj",
"language_model.model.layers.36.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0030428156256676053,
"dbits": 2080899072
}
]
},
{
"idx": 74,
"layers": [
"language_model.model.layers.37.self_attn.q_proj",
"language_model.model.layers.37.self_attn.k_proj",
"language_model.model.layers.37.self_attn.v_proj",
"language_model.model.layers.37.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0029344171285629606,
"dbits": 396361728
}
]
},
{
"idx": 75,
"layers": [
"language_model.model.layers.37.mlp.gate_proj",
"language_model.model.layers.37.mlp.up_proj",
"language_model.model.layers.37.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.005395969003438972,
"dbits": 2080899072
}
]
},
{
"idx": 76,
"layers": [
"language_model.model.layers.38.self_attn.q_proj",
"language_model.model.layers.38.self_attn.k_proj",
"language_model.model.layers.38.self_attn.v_proj",
"language_model.model.layers.38.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0017978318035602459,
"dbits": 396361728
}
]
},
{
"idx": 77,
"layers": [
"language_model.model.layers.38.mlp.gate_proj",
"language_model.model.layers.38.mlp.up_proj",
"language_model.model.layers.38.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0036740973591804504,
"dbits": 2080899072
}
]
},
{
"idx": 78,
"layers": [
"language_model.model.layers.39.self_attn.q_proj",
"language_model.model.layers.39.self_attn.k_proj",
"language_model.model.layers.39.self_attn.v_proj",
"language_model.model.layers.39.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0005030691623687522,
"dbits": 396361728
}
]
},
{
"idx": 79,
"layers": [
"language_model.model.layers.39.mlp.gate_proj",
"language_model.model.layers.39.mlp.up_proj",
"language_model.model.layers.39.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003146367520093951,
"dbits": 2080899072
}
]
},
{
"idx": 80,
"layers": [
"language_model.model.layers.40.self_attn.q_proj",
"language_model.model.layers.40.self_attn.k_proj",
"language_model.model.layers.40.self_attn.v_proj",
"language_model.model.layers.40.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.008280515670776367,
"dbits": 396361728
}
]
},
{
"idx": 81,
"layers": [
"language_model.model.layers.40.mlp.gate_proj",
"language_model.model.layers.40.mlp.up_proj",
"language_model.model.layers.40.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.004743161797523543,
"dbits": 2080899072
}
]
},
{
"idx": 82,
"layers": [
"language_model.model.layers.41.self_attn.q_proj",
"language_model.model.layers.41.self_attn.k_proj",
"language_model.model.layers.41.self_attn.v_proj",
"language_model.model.layers.41.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.015289445966482185,
"dbits": 396361728
}
]
},
{
"idx": 83,
"layers": [
"language_model.model.layers.41.mlp.gate_proj",
"language_model.model.layers.41.mlp.up_proj",
"language_model.model.layers.41.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.00837468057870866,
"dbits": 2080899072
}
]
},
{
"idx": 84,
"layers": [
"language_model.model.layers.42.self_attn.q_proj",
"language_model.model.layers.42.self_attn.k_proj",
"language_model.model.layers.42.self_attn.v_proj",
"language_model.model.layers.42.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0007713317871094194,
"dbits": 396361728
}
]
},
{
"idx": 85,
"layers": [
"language_model.model.layers.42.mlp.gate_proj",
"language_model.model.layers.42.mlp.up_proj",
"language_model.model.layers.42.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0034337289631367063,
"dbits": 2080899072
}
]
},
{
"idx": 86,
"layers": [
"language_model.model.layers.43.self_attn.q_proj",
"language_model.model.layers.43.self_attn.k_proj",
"language_model.model.layers.43.self_attn.v_proj",
"language_model.model.layers.43.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.00845300778746605,
"dbits": 396361728
}
]
},
{
"idx": 87,
"layers": [
"language_model.model.layers.43.mlp.gate_proj",
"language_model.model.layers.43.mlp.up_proj",
"language_model.model.layers.43.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003721737116575252,
"dbits": 2080899072
}
]
},
{
"idx": 88,
"layers": [
"language_model.model.layers.44.self_attn.q_proj",
"language_model.model.layers.44.self_attn.k_proj",
"language_model.model.layers.44.self_attn.v_proj",
"language_model.model.layers.44.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0051841072738170735,
"dbits": 396361728
}
]
},
{
"idx": 89,
"layers": [
"language_model.model.layers.44.mlp.gate_proj",
"language_model.model.layers.44.mlp.up_proj",
"language_model.model.layers.44.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0031947255134582853,
"dbits": 2080899072
}
]
},
{
"idx": 90,
"layers": [
"language_model.model.layers.45.self_attn.q_proj",
"language_model.model.layers.45.self_attn.k_proj",
"language_model.model.layers.45.self_attn.v_proj",
"language_model.model.layers.45.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.001118142157793045,
"dbits": 396361728
}
]
},
{
"idx": 91,
"layers": [
"language_model.model.layers.45.mlp.gate_proj",
"language_model.model.layers.45.mlp.up_proj",
"language_model.model.layers.45.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0033696956932545152,
"dbits": 2080899072
}
]
},
{
"idx": 92,
"layers": [
"language_model.model.layers.46.self_attn.q_proj",
"language_model.model.layers.46.self_attn.k_proj",
"language_model.model.layers.46.self_attn.v_proj",
"language_model.model.layers.46.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0005463138222694397,
"dbits": 396361728
}
]
},
{
"idx": 93,
"layers": [
"language_model.model.layers.46.mlp.gate_proj",
"language_model.model.layers.46.mlp.up_proj",
"language_model.model.layers.46.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.006662502884864807,
"dbits": 2080899072
}
]
},
{
"idx": 94,
"layers": [
"language_model.model.layers.47.self_attn.q_proj",
"language_model.model.layers.47.self_attn.k_proj",
"language_model.model.layers.47.self_attn.v_proj",
"language_model.model.layers.47.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0023998439311981312,
"dbits": 396361728
}
]
},
{
"idx": 95,
"layers": [
"language_model.model.layers.47.mlp.gate_proj",
"language_model.model.layers.47.mlp.up_proj",
"language_model.model.layers.47.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003466875106096279,
"dbits": 2080899072
}
]
},
{
"idx": 96,
"layers": [
"language_model.model.layers.48.self_attn.q_proj",
"language_model.model.layers.48.self_attn.k_proj",
"language_model.model.layers.48.self_attn.v_proj",
"language_model.model.layers.48.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.004037512093782447,
"dbits": 396361728
}
]
},
{
"idx": 97,
"layers": [
"language_model.model.layers.48.mlp.gate_proj",
"language_model.model.layers.48.mlp.up_proj",
"language_model.model.layers.48.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003907855600118637,
"dbits": 2080899072
}
]
},
{
"idx": 98,
"layers": [
"language_model.model.layers.49.self_attn.q_proj",
"language_model.model.layers.49.self_attn.k_proj",
"language_model.model.layers.49.self_attn.v_proj",
"language_model.model.layers.49.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0028403460979462003,
"dbits": 396361728
}
]
},
{
"idx": 99,
"layers": [
"language_model.model.layers.49.mlp.gate_proj",
"language_model.model.layers.49.mlp.up_proj",
"language_model.model.layers.49.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.002681272476911578,
"dbits": 2080899072
}
]
},
{
"idx": 100,
"layers": [
"language_model.model.layers.50.self_attn.q_proj",
"language_model.model.layers.50.self_attn.k_proj",
"language_model.model.layers.50.self_attn.v_proj",
"language_model.model.layers.50.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0014717683196068254,
"dbits": 396361728
}
]
},
{
"idx": 101,
"layers": [
"language_model.model.layers.50.mlp.gate_proj",
"language_model.model.layers.50.mlp.up_proj",
"language_model.model.layers.50.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0033254854381084553,
"dbits": 2080899072
}
]
},
{
"idx": 102,
"layers": [
"language_model.model.layers.51.self_attn.q_proj",
"language_model.model.layers.51.self_attn.k_proj",
"language_model.model.layers.51.self_attn.v_proj",
"language_model.model.layers.51.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0007418908178806749,
"dbits": 396361728
}
]
},
{
"idx": 103,
"layers": [
"language_model.model.layers.51.mlp.gate_proj",
"language_model.model.layers.51.mlp.up_proj",
"language_model.model.layers.51.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0038238234817982164,
"dbits": 2080899072
}
]
},
{
"idx": 104,
"layers": [
"language_model.model.layers.52.self_attn.q_proj",
"language_model.model.layers.52.self_attn.k_proj",
"language_model.model.layers.52.self_attn.v_proj",
"language_model.model.layers.52.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0012986376881599648,
"dbits": 396361728
}
]
},
{
"idx": 105,
"layers": [
"language_model.model.layers.52.mlp.gate_proj",
"language_model.model.layers.52.mlp.up_proj",
"language_model.model.layers.52.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0018054209649562836,
"dbits": 2080899072
}
]
},
{
"idx": 106,
"layers": [
"language_model.model.layers.53.self_attn.q_proj",
"language_model.model.layers.53.self_attn.k_proj",
"language_model.model.layers.53.self_attn.v_proj",
"language_model.model.layers.53.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.004864251613616977,
"dbits": 396361728
}
]
},
{
"idx": 107,
"layers": [
"language_model.model.layers.53.mlp.gate_proj",
"language_model.model.layers.53.mlp.up_proj",
"language_model.model.layers.53.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0019967712461948506,
"dbits": 2080899072
}
]
},
{
"idx": 108,
"layers": [
"language_model.model.layers.54.self_attn.q_proj",
"language_model.model.layers.54.self_attn.k_proj",
"language_model.model.layers.54.self_attn.v_proj",
"language_model.model.layers.54.self_attn.o_proj"
],
"candidates": [
{
"dkld": -5.696490406992272e-05,
"dbits": 396361728
}
]
},
{
"idx": 109,
"layers": [
"language_model.model.layers.54.mlp.gate_proj",
"language_model.model.layers.54.mlp.up_proj",
"language_model.model.layers.54.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.0024598926305771096,
"dbits": 2080899072
}
]
},
{
"idx": 110,
"layers": [
"language_model.model.layers.55.self_attn.q_proj",
"language_model.model.layers.55.self_attn.k_proj",
"language_model.model.layers.55.self_attn.v_proj",
"language_model.model.layers.55.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0008994087576865706,
"dbits": 396361728
}
]
},
{
"idx": 111,
"layers": [
"language_model.model.layers.55.mlp.gate_proj",
"language_model.model.layers.55.mlp.up_proj",
"language_model.model.layers.55.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.003040955960750602,
"dbits": 2080899072
}
]
},
{
"idx": 112,
"layers": [
"language_model.model.layers.56.self_attn.q_proj",
"language_model.model.layers.56.self_attn.k_proj",
"language_model.model.layers.56.self_attn.v_proj",
"language_model.model.layers.56.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0004954591393471208,
"dbits": 396361728
}
]
},
{
"idx": 113,
"layers": [
"language_model.model.layers.56.mlp.gate_proj",
"language_model.model.layers.56.mlp.up_proj",
"language_model.model.layers.56.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.002797749638557445,
"dbits": 2080899072
}
]
},
{
"idx": 114,
"layers": [
"language_model.model.layers.57.self_attn.q_proj",
"language_model.model.layers.57.self_attn.k_proj",
"language_model.model.layers.57.self_attn.v_proj",
"language_model.model.layers.57.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0017556458711624479,
"dbits": 396361728
}
]
},
{
"idx": 115,
"layers": [
"language_model.model.layers.57.mlp.gate_proj",
"language_model.model.layers.57.mlp.up_proj",
"language_model.model.layers.57.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.001631450653076183,
"dbits": 2080899072
}
]
},
{
"idx": 116,
"layers": [
"language_model.model.layers.58.self_attn.q_proj",
"language_model.model.layers.58.self_attn.k_proj",
"language_model.model.layers.58.self_attn.v_proj",
"language_model.model.layers.58.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.0004269838333129661,
"dbits": 396361728
}
]
},
{
"idx": 117,
"layers": [
"language_model.model.layers.58.mlp.gate_proj",
"language_model.model.layers.58.mlp.up_proj",
"language_model.model.layers.58.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.004021327197551772,
"dbits": 2080899072
}
]
},
{
"idx": 118,
"layers": [
"language_model.model.layers.59.self_attn.q_proj",
"language_model.model.layers.59.self_attn.k_proj",
"language_model.model.layers.59.self_attn.v_proj",
"language_model.model.layers.59.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0032634086906910276,
"dbits": 396361728
}
]
},
{
"idx": 119,
"layers": [
"language_model.model.layers.59.mlp.gate_proj",
"language_model.model.layers.59.mlp.up_proj",
"language_model.model.layers.59.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.005423430353403091,
"dbits": 2080899072
}
]
},
{
"idx": 120,
"layers": [
"language_model.model.layers.60.self_attn.q_proj",
"language_model.model.layers.60.self_attn.k_proj",
"language_model.model.layers.60.self_attn.v_proj",
"language_model.model.layers.60.self_attn.o_proj"
],
"candidates": [
{
"dkld": -0.0010337680578231812,
"dbits": 396361728
}
]
},
{
"idx": 121,
"layers": [
"language_model.model.layers.60.mlp.gate_proj",
"language_model.model.layers.60.mlp.up_proj",
"language_model.model.layers.60.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.008122941851615939,
"dbits": 2080899072
}
]
},
{
"idx": 122,
"layers": [
"language_model.model.layers.61.self_attn.q_proj",
"language_model.model.layers.61.self_attn.k_proj",
"language_model.model.layers.61.self_attn.v_proj",
"language_model.model.layers.61.self_attn.o_proj"
],
"candidates": [
{
"dkld": 0.00033112913370131336,
"dbits": 396361728
}
]
},
{
"idx": 123,
"layers": [
"language_model.model.layers.61.mlp.gate_proj",
"language_model.model.layers.61.mlp.up_proj",
"language_model.model.layers.61.mlp.down_proj"
],
"candidates": [
{
"dkld": -0.007963605970144283,
"dbits": 2080899072
}
]
}
],
"base_kld": 0.4373273827135563,
"arch_string": "Gemma3ForConditionalGeneration"
}