| { | |
| "base": { | |
| "dir": "D:\\main\\program\\AI\\CoridorGreenScreenMattingCPUfree\\tmp\\quants\\Gemma-3-R1984-27B-2.0bpw", | |
| "bpw": 2.004435066344246 | |
| }, | |
| "alts": [ | |
| { | |
| "dir": "D:\\main\\program\\AI\\CoridorGreenScreenMattingCPUfree\\tmp\\quants\\Gemma-3-R1984-27B-8.0bpw", | |
| "bpw": 8.004435066344247 | |
| } | |
| ], | |
| "groups": [ | |
| { | |
| "idx": 0, | |
| "layers": [ | |
| "language_model.model.layers.0.self_attn.q_proj", | |
| "language_model.model.layers.0.self_attn.k_proj", | |
| "language_model.model.layers.0.self_attn.v_proj", | |
| "language_model.model.layers.0.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.006917499005794525, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 1, | |
| "layers": [ | |
| "language_model.model.layers.0.mlp.gate_proj", | |
| "language_model.model.layers.0.mlp.up_proj", | |
| "language_model.model.layers.0.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004495760053396247, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 2, | |
| "layers": [ | |
| "language_model.model.layers.1.self_attn.q_proj", | |
| "language_model.model.layers.1.self_attn.k_proj", | |
| "language_model.model.layers.1.self_attn.v_proj", | |
| "language_model.model.layers.1.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0004842020571231842, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 3, | |
| "layers": [ | |
| "language_model.model.layers.1.mlp.gate_proj", | |
| "language_model.model.layers.1.mlp.up_proj", | |
| "language_model.model.layers.1.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.005311993509531043, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 4, | |
| "layers": [ | |
| "language_model.model.layers.2.self_attn.q_proj", | |
| "language_model.model.layers.2.self_attn.k_proj", | |
| "language_model.model.layers.2.self_attn.v_proj", | |
| "language_model.model.layers.2.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0011243283748627042, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 5, | |
| "layers": [ | |
| "language_model.model.layers.2.mlp.gate_proj", | |
| "language_model.model.layers.2.mlp.up_proj", | |
| "language_model.model.layers.2.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.009011824429035198, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 6, | |
| "layers": [ | |
| "language_model.model.layers.3.self_attn.q_proj", | |
| "language_model.model.layers.3.self_attn.k_proj", | |
| "language_model.model.layers.3.self_attn.v_proj", | |
| "language_model.model.layers.3.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.003413629531860307, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 7, | |
| "layers": [ | |
| "language_model.model.layers.3.mlp.gate_proj", | |
| "language_model.model.layers.3.mlp.up_proj", | |
| "language_model.model.layers.3.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.006673009693622611, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 8, | |
| "layers": [ | |
| "language_model.model.layers.4.self_attn.q_proj", | |
| "language_model.model.layers.4.self_attn.k_proj", | |
| "language_model.model.layers.4.self_attn.v_proj", | |
| "language_model.model.layers.4.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0005826622247695479, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 9, | |
| "layers": [ | |
| "language_model.model.layers.4.mlp.gate_proj", | |
| "language_model.model.layers.4.mlp.up_proj", | |
| "language_model.model.layers.4.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0080329388380051, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 10, | |
| "layers": [ | |
| "language_model.model.layers.5.self_attn.q_proj", | |
| "language_model.model.layers.5.self_attn.k_proj", | |
| "language_model.model.layers.5.self_attn.v_proj", | |
| "language_model.model.layers.5.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0023767203092575073, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 11, | |
| "layers": [ | |
| "language_model.model.layers.5.mlp.gate_proj", | |
| "language_model.model.layers.5.mlp.up_proj", | |
| "language_model.model.layers.5.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.010135890543460868, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 12, | |
| "layers": [ | |
| "language_model.model.layers.6.self_attn.q_proj", | |
| "language_model.model.layers.6.self_attn.k_proj", | |
| "language_model.model.layers.6.self_attn.v_proj", | |
| "language_model.model.layers.6.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0027037844061851835, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 13, | |
| "layers": [ | |
| "language_model.model.layers.6.mlp.gate_proj", | |
| "language_model.model.layers.6.mlp.up_proj", | |
| "language_model.model.layers.6.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0041308201849460935, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 14, | |
| "layers": [ | |
| "language_model.model.layers.7.self_attn.q_proj", | |
| "language_model.model.layers.7.self_attn.k_proj", | |
| "language_model.model.layers.7.self_attn.v_proj", | |
| "language_model.model.layers.7.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0014376796782016865, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 15, | |
| "layers": [ | |
| "language_model.model.layers.7.mlp.gate_proj", | |
| "language_model.model.layers.7.mlp.up_proj", | |
| "language_model.model.layers.7.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.01197697520256047, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 16, | |
| "layers": [ | |
| "language_model.model.layers.8.self_attn.q_proj", | |
| "language_model.model.layers.8.self_attn.k_proj", | |
| "language_model.model.layers.8.self_attn.v_proj", | |
| "language_model.model.layers.8.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0037170641124248394, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 17, | |
| "layers": [ | |
| "language_model.model.layers.8.mlp.gate_proj", | |
| "language_model.model.layers.8.mlp.up_proj", | |
| "language_model.model.layers.8.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0004419878125190846, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 18, | |
| "layers": [ | |
| "language_model.model.layers.9.self_attn.q_proj", | |
| "language_model.model.layers.9.self_attn.k_proj", | |
| "language_model.model.layers.9.self_attn.v_proj", | |
| "language_model.model.layers.9.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004326772689819347, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 19, | |
| "layers": [ | |
| "language_model.model.layers.9.mlp.gate_proj", | |
| "language_model.model.layers.9.mlp.up_proj", | |
| "language_model.model.layers.9.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.010839792340993915, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 20, | |
| "layers": [ | |
| "language_model.model.layers.10.self_attn.q_proj", | |
| "language_model.model.layers.10.self_attn.k_proj", | |
| "language_model.model.layers.10.self_attn.v_proj", | |
| "language_model.model.layers.10.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.009040921181440398, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 21, | |
| "layers": [ | |
| "language_model.model.layers.10.mlp.gate_proj", | |
| "language_model.model.layers.10.mlp.up_proj", | |
| "language_model.model.layers.10.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.031036542356014274, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 22, | |
| "layers": [ | |
| "language_model.model.layers.11.self_attn.q_proj", | |
| "language_model.model.layers.11.self_attn.k_proj", | |
| "language_model.model.layers.11.self_attn.v_proj", | |
| "language_model.model.layers.11.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00979023426771164, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 23, | |
| "layers": [ | |
| "language_model.model.layers.11.mlp.gate_proj", | |
| "language_model.model.layers.11.mlp.up_proj", | |
| "language_model.model.layers.11.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.007736762613058112, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 24, | |
| "layers": [ | |
| "language_model.model.layers.12.self_attn.q_proj", | |
| "language_model.model.layers.12.self_attn.k_proj", | |
| "language_model.model.layers.12.self_attn.v_proj", | |
| "language_model.model.layers.12.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003069894015789054, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 25, | |
| "layers": [ | |
| "language_model.model.layers.12.mlp.gate_proj", | |
| "language_model.model.layers.12.mlp.up_proj", | |
| "language_model.model.layers.12.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.014686931669712078, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 26, | |
| "layers": [ | |
| "language_model.model.layers.13.self_attn.q_proj", | |
| "language_model.model.layers.13.self_attn.k_proj", | |
| "language_model.model.layers.13.self_attn.v_proj", | |
| "language_model.model.layers.13.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.000129348039627053, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 27, | |
| "layers": [ | |
| "language_model.model.layers.13.mlp.gate_proj", | |
| "language_model.model.layers.13.mlp.up_proj", | |
| "language_model.model.layers.13.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003941317647695564, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 28, | |
| "layers": [ | |
| "language_model.model.layers.14.self_attn.q_proj", | |
| "language_model.model.layers.14.self_attn.k_proj", | |
| "language_model.model.layers.14.self_attn.v_proj", | |
| "language_model.model.layers.14.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0035466991364956346, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 29, | |
| "layers": [ | |
| "language_model.model.layers.14.mlp.gate_proj", | |
| "language_model.model.layers.14.mlp.up_proj", | |
| "language_model.model.layers.14.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.022119185328483615, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 30, | |
| "layers": [ | |
| "language_model.model.layers.15.self_attn.q_proj", | |
| "language_model.model.layers.15.self_attn.k_proj", | |
| "language_model.model.layers.15.self_attn.v_proj", | |
| "language_model.model.layers.15.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.003810518234968141, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 31, | |
| "layers": [ | |
| "language_model.model.layers.15.mlp.gate_proj", | |
| "language_model.model.layers.15.mlp.up_proj", | |
| "language_model.model.layers.15.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.009127749502658877, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 32, | |
| "layers": [ | |
| "language_model.model.layers.16.self_attn.q_proj", | |
| "language_model.model.layers.16.self_attn.k_proj", | |
| "language_model.model.layers.16.self_attn.v_proj", | |
| "language_model.model.layers.16.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.006637018173933029, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 33, | |
| "layers": [ | |
| "language_model.model.layers.16.mlp.gate_proj", | |
| "language_model.model.layers.16.mlp.up_proj", | |
| "language_model.model.layers.16.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.021292066574096713, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 34, | |
| "layers": [ | |
| "language_model.model.layers.17.self_attn.q_proj", | |
| "language_model.model.layers.17.self_attn.k_proj", | |
| "language_model.model.layers.17.self_attn.v_proj", | |
| "language_model.model.layers.17.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0025063112378120866, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 35, | |
| "layers": [ | |
| "language_model.model.layers.17.mlp.gate_proj", | |
| "language_model.model.layers.17.mlp.up_proj", | |
| "language_model.model.layers.17.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0022593840956687816, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 36, | |
| "layers": [ | |
| "language_model.model.layers.18.self_attn.q_proj", | |
| "language_model.model.layers.18.self_attn.k_proj", | |
| "language_model.model.layers.18.self_attn.v_proj", | |
| "language_model.model.layers.18.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.002482272684574127, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 37, | |
| "layers": [ | |
| "language_model.model.layers.18.mlp.gate_proj", | |
| "language_model.model.layers.18.mlp.up_proj", | |
| "language_model.model.layers.18.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.000394851714372646, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 38, | |
| "layers": [ | |
| "language_model.model.layers.19.self_attn.q_proj", | |
| "language_model.model.layers.19.self_attn.k_proj", | |
| "language_model.model.layers.19.self_attn.v_proj", | |
| "language_model.model.layers.19.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0010013014078140703, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 39, | |
| "layers": [ | |
| "language_model.model.layers.19.mlp.gate_proj", | |
| "language_model.model.layers.19.mlp.up_proj", | |
| "language_model.model.layers.19.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.020440497994422935, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 40, | |
| "layers": [ | |
| "language_model.model.layers.20.self_attn.q_proj", | |
| "language_model.model.layers.20.self_attn.k_proj", | |
| "language_model.model.layers.20.self_attn.v_proj", | |
| "language_model.model.layers.20.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.004292172193527177, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 41, | |
| "layers": [ | |
| "language_model.model.layers.20.mlp.gate_proj", | |
| "language_model.model.layers.20.mlp.up_proj", | |
| "language_model.model.layers.20.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0009037740528583527, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 42, | |
| "layers": [ | |
| "language_model.model.layers.21.self_attn.q_proj", | |
| "language_model.model.layers.21.self_attn.k_proj", | |
| "language_model.model.layers.21.self_attn.v_proj", | |
| "language_model.model.layers.21.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.006902486085891724, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 43, | |
| "layers": [ | |
| "language_model.model.layers.21.mlp.gate_proj", | |
| "language_model.model.layers.21.mlp.up_proj", | |
| "language_model.model.layers.21.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00929136574268341, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 44, | |
| "layers": [ | |
| "language_model.model.layers.22.self_attn.q_proj", | |
| "language_model.model.layers.22.self_attn.k_proj", | |
| "language_model.model.layers.22.self_attn.v_proj", | |
| "language_model.model.layers.22.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0036064453423023113, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 45, | |
| "layers": [ | |
| "language_model.model.layers.22.mlp.gate_proj", | |
| "language_model.model.layers.22.mlp.up_proj", | |
| "language_model.model.layers.22.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0006043247878551594, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 46, | |
| "layers": [ | |
| "language_model.model.layers.23.self_attn.q_proj", | |
| "language_model.model.layers.23.self_attn.k_proj", | |
| "language_model.model.layers.23.self_attn.v_proj", | |
| "language_model.model.layers.23.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.028081689029932022, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 47, | |
| "layers": [ | |
| "language_model.model.layers.23.mlp.gate_proj", | |
| "language_model.model.layers.23.mlp.up_proj", | |
| "language_model.model.layers.23.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00137981697916989, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 48, | |
| "layers": [ | |
| "language_model.model.layers.24.self_attn.q_proj", | |
| "language_model.model.layers.24.self_attn.k_proj", | |
| "language_model.model.layers.24.self_attn.v_proj", | |
| "language_model.model.layers.24.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0014152429997921212, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 49, | |
| "layers": [ | |
| "language_model.model.layers.24.mlp.gate_proj", | |
| "language_model.model.layers.24.mlp.up_proj", | |
| "language_model.model.layers.24.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004900486022233974, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 50, | |
| "layers": [ | |
| "language_model.model.layers.25.self_attn.q_proj", | |
| "language_model.model.layers.25.self_attn.k_proj", | |
| "language_model.model.layers.25.self_attn.v_proj", | |
| "language_model.model.layers.25.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.008432538062334072, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 51, | |
| "layers": [ | |
| "language_model.model.layers.25.mlp.gate_proj", | |
| "language_model.model.layers.25.mlp.up_proj", | |
| "language_model.model.layers.25.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.005563641339540459, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 52, | |
| "layers": [ | |
| "language_model.model.layers.26.self_attn.q_proj", | |
| "language_model.model.layers.26.self_attn.k_proj", | |
| "language_model.model.layers.26.self_attn.v_proj", | |
| "language_model.model.layers.26.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.010603216290473949, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 53, | |
| "layers": [ | |
| "language_model.model.layers.26.mlp.gate_proj", | |
| "language_model.model.layers.26.mlp.up_proj", | |
| "language_model.model.layers.26.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003027988225221656, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 54, | |
| "layers": [ | |
| "language_model.model.layers.27.self_attn.q_proj", | |
| "language_model.model.layers.27.self_attn.k_proj", | |
| "language_model.model.layers.27.self_attn.v_proj", | |
| "language_model.model.layers.27.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00233266279101374, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 55, | |
| "layers": [ | |
| "language_model.model.layers.27.mlp.gate_proj", | |
| "language_model.model.layers.27.mlp.up_proj", | |
| "language_model.model.layers.27.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0059184454381466245, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 56, | |
| "layers": [ | |
| "language_model.model.layers.28.self_attn.q_proj", | |
| "language_model.model.layers.28.self_attn.k_proj", | |
| "language_model.model.layers.28.self_attn.v_proj", | |
| "language_model.model.layers.28.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0004229128360748735, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 57, | |
| "layers": [ | |
| "language_model.model.layers.28.mlp.gate_proj", | |
| "language_model.model.layers.28.mlp.up_proj", | |
| "language_model.model.layers.28.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.007507449388504006, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 58, | |
| "layers": [ | |
| "language_model.model.layers.29.self_attn.q_proj", | |
| "language_model.model.layers.29.self_attn.k_proj", | |
| "language_model.model.layers.29.self_attn.v_proj", | |
| "language_model.model.layers.29.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0012179315090179443, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 59, | |
| "layers": [ | |
| "language_model.model.layers.29.mlp.gate_proj", | |
| "language_model.model.layers.29.mlp.up_proj", | |
| "language_model.model.layers.29.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.007656254619359926, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 60, | |
| "layers": [ | |
| "language_model.model.layers.30.self_attn.q_proj", | |
| "language_model.model.layers.30.self_attn.k_proj", | |
| "language_model.model.layers.30.self_attn.v_proj", | |
| "language_model.model.layers.30.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0006962120532989502, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 61, | |
| "layers": [ | |
| "language_model.model.layers.30.mlp.gate_proj", | |
| "language_model.model.layers.30.mlp.up_proj", | |
| "language_model.model.layers.30.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0112728171050549, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 62, | |
| "layers": [ | |
| "language_model.model.layers.31.self_attn.q_proj", | |
| "language_model.model.layers.31.self_attn.k_proj", | |
| "language_model.model.layers.31.self_attn.v_proj", | |
| "language_model.model.layers.31.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0017989106476307137, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 63, | |
| "layers": [ | |
| "language_model.model.layers.31.mlp.gate_proj", | |
| "language_model.model.layers.31.mlp.up_proj", | |
| "language_model.model.layers.31.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0063770614564419015, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 64, | |
| "layers": [ | |
| "language_model.model.layers.32.self_attn.q_proj", | |
| "language_model.model.layers.32.self_attn.k_proj", | |
| "language_model.model.layers.32.self_attn.v_proj", | |
| "language_model.model.layers.32.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00029214099049568176, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 65, | |
| "layers": [ | |
| "language_model.model.layers.32.mlp.gate_proj", | |
| "language_model.model.layers.32.mlp.up_proj", | |
| "language_model.model.layers.32.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.006251434981823012, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 66, | |
| "layers": [ | |
| "language_model.model.layers.33.self_attn.q_proj", | |
| "language_model.model.layers.33.self_attn.k_proj", | |
| "language_model.model.layers.33.self_attn.v_proj", | |
| "language_model.model.layers.33.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0005352959036826754, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 67, | |
| "layers": [ | |
| "language_model.model.layers.33.mlp.gate_proj", | |
| "language_model.model.layers.33.mlp.up_proj", | |
| "language_model.model.layers.33.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.005572766810655605, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 68, | |
| "layers": [ | |
| "language_model.model.layers.34.self_attn.q_proj", | |
| "language_model.model.layers.34.self_attn.k_proj", | |
| "language_model.model.layers.34.self_attn.v_proj", | |
| "language_model.model.layers.34.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0008197985589504242, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 69, | |
| "layers": [ | |
| "language_model.model.layers.34.mlp.gate_proj", | |
| "language_model.model.layers.34.mlp.up_proj", | |
| "language_model.model.layers.34.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004082408547401439, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 70, | |
| "layers": [ | |
| "language_model.model.layers.35.self_attn.q_proj", | |
| "language_model.model.layers.35.self_attn.k_proj", | |
| "language_model.model.layers.35.self_attn.v_proj", | |
| "language_model.model.layers.35.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0032249547541141066, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 71, | |
| "layers": [ | |
| "language_model.model.layers.35.mlp.gate_proj", | |
| "language_model.model.layers.35.mlp.up_proj", | |
| "language_model.model.layers.35.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0070062801241874695, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 72, | |
| "layers": [ | |
| "language_model.model.layers.36.self_attn.q_proj", | |
| "language_model.model.layers.36.self_attn.k_proj", | |
| "language_model.model.layers.36.self_attn.v_proj", | |
| "language_model.model.layers.36.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0005763806402683258, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 73, | |
| "layers": [ | |
| "language_model.model.layers.36.mlp.gate_proj", | |
| "language_model.model.layers.36.mlp.up_proj", | |
| "language_model.model.layers.36.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0030428156256676053, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 74, | |
| "layers": [ | |
| "language_model.model.layers.37.self_attn.q_proj", | |
| "language_model.model.layers.37.self_attn.k_proj", | |
| "language_model.model.layers.37.self_attn.v_proj", | |
| "language_model.model.layers.37.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0029344171285629606, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 75, | |
| "layers": [ | |
| "language_model.model.layers.37.mlp.gate_proj", | |
| "language_model.model.layers.37.mlp.up_proj", | |
| "language_model.model.layers.37.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.005395969003438972, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 76, | |
| "layers": [ | |
| "language_model.model.layers.38.self_attn.q_proj", | |
| "language_model.model.layers.38.self_attn.k_proj", | |
| "language_model.model.layers.38.self_attn.v_proj", | |
| "language_model.model.layers.38.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0017978318035602459, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 77, | |
| "layers": [ | |
| "language_model.model.layers.38.mlp.gate_proj", | |
| "language_model.model.layers.38.mlp.up_proj", | |
| "language_model.model.layers.38.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0036740973591804504, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 78, | |
| "layers": [ | |
| "language_model.model.layers.39.self_attn.q_proj", | |
| "language_model.model.layers.39.self_attn.k_proj", | |
| "language_model.model.layers.39.self_attn.v_proj", | |
| "language_model.model.layers.39.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0005030691623687522, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 79, | |
| "layers": [ | |
| "language_model.model.layers.39.mlp.gate_proj", | |
| "language_model.model.layers.39.mlp.up_proj", | |
| "language_model.model.layers.39.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003146367520093951, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 80, | |
| "layers": [ | |
| "language_model.model.layers.40.self_attn.q_proj", | |
| "language_model.model.layers.40.self_attn.k_proj", | |
| "language_model.model.layers.40.self_attn.v_proj", | |
| "language_model.model.layers.40.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.008280515670776367, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 81, | |
| "layers": [ | |
| "language_model.model.layers.40.mlp.gate_proj", | |
| "language_model.model.layers.40.mlp.up_proj", | |
| "language_model.model.layers.40.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004743161797523543, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 82, | |
| "layers": [ | |
| "language_model.model.layers.41.self_attn.q_proj", | |
| "language_model.model.layers.41.self_attn.k_proj", | |
| "language_model.model.layers.41.self_attn.v_proj", | |
| "language_model.model.layers.41.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.015289445966482185, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 83, | |
| "layers": [ | |
| "language_model.model.layers.41.mlp.gate_proj", | |
| "language_model.model.layers.41.mlp.up_proj", | |
| "language_model.model.layers.41.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00837468057870866, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 84, | |
| "layers": [ | |
| "language_model.model.layers.42.self_attn.q_proj", | |
| "language_model.model.layers.42.self_attn.k_proj", | |
| "language_model.model.layers.42.self_attn.v_proj", | |
| "language_model.model.layers.42.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0007713317871094194, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 85, | |
| "layers": [ | |
| "language_model.model.layers.42.mlp.gate_proj", | |
| "language_model.model.layers.42.mlp.up_proj", | |
| "language_model.model.layers.42.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0034337289631367063, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 86, | |
| "layers": [ | |
| "language_model.model.layers.43.self_attn.q_proj", | |
| "language_model.model.layers.43.self_attn.k_proj", | |
| "language_model.model.layers.43.self_attn.v_proj", | |
| "language_model.model.layers.43.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.00845300778746605, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 87, | |
| "layers": [ | |
| "language_model.model.layers.43.mlp.gate_proj", | |
| "language_model.model.layers.43.mlp.up_proj", | |
| "language_model.model.layers.43.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003721737116575252, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 88, | |
| "layers": [ | |
| "language_model.model.layers.44.self_attn.q_proj", | |
| "language_model.model.layers.44.self_attn.k_proj", | |
| "language_model.model.layers.44.self_attn.v_proj", | |
| "language_model.model.layers.44.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0051841072738170735, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 89, | |
| "layers": [ | |
| "language_model.model.layers.44.mlp.gate_proj", | |
| "language_model.model.layers.44.mlp.up_proj", | |
| "language_model.model.layers.44.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0031947255134582853, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 90, | |
| "layers": [ | |
| "language_model.model.layers.45.self_attn.q_proj", | |
| "language_model.model.layers.45.self_attn.k_proj", | |
| "language_model.model.layers.45.self_attn.v_proj", | |
| "language_model.model.layers.45.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.001118142157793045, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 91, | |
| "layers": [ | |
| "language_model.model.layers.45.mlp.gate_proj", | |
| "language_model.model.layers.45.mlp.up_proj", | |
| "language_model.model.layers.45.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0033696956932545152, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 92, | |
| "layers": [ | |
| "language_model.model.layers.46.self_attn.q_proj", | |
| "language_model.model.layers.46.self_attn.k_proj", | |
| "language_model.model.layers.46.self_attn.v_proj", | |
| "language_model.model.layers.46.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0005463138222694397, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 93, | |
| "layers": [ | |
| "language_model.model.layers.46.mlp.gate_proj", | |
| "language_model.model.layers.46.mlp.up_proj", | |
| "language_model.model.layers.46.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.006662502884864807, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 94, | |
| "layers": [ | |
| "language_model.model.layers.47.self_attn.q_proj", | |
| "language_model.model.layers.47.self_attn.k_proj", | |
| "language_model.model.layers.47.self_attn.v_proj", | |
| "language_model.model.layers.47.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0023998439311981312, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 95, | |
| "layers": [ | |
| "language_model.model.layers.47.mlp.gate_proj", | |
| "language_model.model.layers.47.mlp.up_proj", | |
| "language_model.model.layers.47.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003466875106096279, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 96, | |
| "layers": [ | |
| "language_model.model.layers.48.self_attn.q_proj", | |
| "language_model.model.layers.48.self_attn.k_proj", | |
| "language_model.model.layers.48.self_attn.v_proj", | |
| "language_model.model.layers.48.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004037512093782447, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 97, | |
| "layers": [ | |
| "language_model.model.layers.48.mlp.gate_proj", | |
| "language_model.model.layers.48.mlp.up_proj", | |
| "language_model.model.layers.48.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003907855600118637, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 98, | |
| "layers": [ | |
| "language_model.model.layers.49.self_attn.q_proj", | |
| "language_model.model.layers.49.self_attn.k_proj", | |
| "language_model.model.layers.49.self_attn.v_proj", | |
| "language_model.model.layers.49.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0028403460979462003, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 99, | |
| "layers": [ | |
| "language_model.model.layers.49.mlp.gate_proj", | |
| "language_model.model.layers.49.mlp.up_proj", | |
| "language_model.model.layers.49.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.002681272476911578, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 100, | |
| "layers": [ | |
| "language_model.model.layers.50.self_attn.q_proj", | |
| "language_model.model.layers.50.self_attn.k_proj", | |
| "language_model.model.layers.50.self_attn.v_proj", | |
| "language_model.model.layers.50.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0014717683196068254, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 101, | |
| "layers": [ | |
| "language_model.model.layers.50.mlp.gate_proj", | |
| "language_model.model.layers.50.mlp.up_proj", | |
| "language_model.model.layers.50.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0033254854381084553, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 102, | |
| "layers": [ | |
| "language_model.model.layers.51.self_attn.q_proj", | |
| "language_model.model.layers.51.self_attn.k_proj", | |
| "language_model.model.layers.51.self_attn.v_proj", | |
| "language_model.model.layers.51.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0007418908178806749, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 103, | |
| "layers": [ | |
| "language_model.model.layers.51.mlp.gate_proj", | |
| "language_model.model.layers.51.mlp.up_proj", | |
| "language_model.model.layers.51.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0038238234817982164, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 104, | |
| "layers": [ | |
| "language_model.model.layers.52.self_attn.q_proj", | |
| "language_model.model.layers.52.self_attn.k_proj", | |
| "language_model.model.layers.52.self_attn.v_proj", | |
| "language_model.model.layers.52.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0012986376881599648, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 105, | |
| "layers": [ | |
| "language_model.model.layers.52.mlp.gate_proj", | |
| "language_model.model.layers.52.mlp.up_proj", | |
| "language_model.model.layers.52.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0018054209649562836, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 106, | |
| "layers": [ | |
| "language_model.model.layers.53.self_attn.q_proj", | |
| "language_model.model.layers.53.self_attn.k_proj", | |
| "language_model.model.layers.53.self_attn.v_proj", | |
| "language_model.model.layers.53.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004864251613616977, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 107, | |
| "layers": [ | |
| "language_model.model.layers.53.mlp.gate_proj", | |
| "language_model.model.layers.53.mlp.up_proj", | |
| "language_model.model.layers.53.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0019967712461948506, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 108, | |
| "layers": [ | |
| "language_model.model.layers.54.self_attn.q_proj", | |
| "language_model.model.layers.54.self_attn.k_proj", | |
| "language_model.model.layers.54.self_attn.v_proj", | |
| "language_model.model.layers.54.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -5.696490406992272e-05, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 109, | |
| "layers": [ | |
| "language_model.model.layers.54.mlp.gate_proj", | |
| "language_model.model.layers.54.mlp.up_proj", | |
| "language_model.model.layers.54.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0024598926305771096, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 110, | |
| "layers": [ | |
| "language_model.model.layers.55.self_attn.q_proj", | |
| "language_model.model.layers.55.self_attn.k_proj", | |
| "language_model.model.layers.55.self_attn.v_proj", | |
| "language_model.model.layers.55.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0008994087576865706, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 111, | |
| "layers": [ | |
| "language_model.model.layers.55.mlp.gate_proj", | |
| "language_model.model.layers.55.mlp.up_proj", | |
| "language_model.model.layers.55.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.003040955960750602, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 112, | |
| "layers": [ | |
| "language_model.model.layers.56.self_attn.q_proj", | |
| "language_model.model.layers.56.self_attn.k_proj", | |
| "language_model.model.layers.56.self_attn.v_proj", | |
| "language_model.model.layers.56.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0004954591393471208, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 113, | |
| "layers": [ | |
| "language_model.model.layers.56.mlp.gate_proj", | |
| "language_model.model.layers.56.mlp.up_proj", | |
| "language_model.model.layers.56.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.002797749638557445, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 114, | |
| "layers": [ | |
| "language_model.model.layers.57.self_attn.q_proj", | |
| "language_model.model.layers.57.self_attn.k_proj", | |
| "language_model.model.layers.57.self_attn.v_proj", | |
| "language_model.model.layers.57.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0017556458711624479, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 115, | |
| "layers": [ | |
| "language_model.model.layers.57.mlp.gate_proj", | |
| "language_model.model.layers.57.mlp.up_proj", | |
| "language_model.model.layers.57.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.001631450653076183, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 116, | |
| "layers": [ | |
| "language_model.model.layers.58.self_attn.q_proj", | |
| "language_model.model.layers.58.self_attn.k_proj", | |
| "language_model.model.layers.58.self_attn.v_proj", | |
| "language_model.model.layers.58.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.0004269838333129661, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 117, | |
| "layers": [ | |
| "language_model.model.layers.58.mlp.gate_proj", | |
| "language_model.model.layers.58.mlp.up_proj", | |
| "language_model.model.layers.58.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.004021327197551772, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 118, | |
| "layers": [ | |
| "language_model.model.layers.59.self_attn.q_proj", | |
| "language_model.model.layers.59.self_attn.k_proj", | |
| "language_model.model.layers.59.self_attn.v_proj", | |
| "language_model.model.layers.59.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0032634086906910276, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 119, | |
| "layers": [ | |
| "language_model.model.layers.59.mlp.gate_proj", | |
| "language_model.model.layers.59.mlp.up_proj", | |
| "language_model.model.layers.59.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.005423430353403091, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 120, | |
| "layers": [ | |
| "language_model.model.layers.60.self_attn.q_proj", | |
| "language_model.model.layers.60.self_attn.k_proj", | |
| "language_model.model.layers.60.self_attn.v_proj", | |
| "language_model.model.layers.60.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.0010337680578231812, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 121, | |
| "layers": [ | |
| "language_model.model.layers.60.mlp.gate_proj", | |
| "language_model.model.layers.60.mlp.up_proj", | |
| "language_model.model.layers.60.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.008122941851615939, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 122, | |
| "layers": [ | |
| "language_model.model.layers.61.self_attn.q_proj", | |
| "language_model.model.layers.61.self_attn.k_proj", | |
| "language_model.model.layers.61.self_attn.v_proj", | |
| "language_model.model.layers.61.self_attn.o_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": 0.00033112913370131336, | |
| "dbits": 396361728 | |
| } | |
| ] | |
| }, | |
| { | |
| "idx": 123, | |
| "layers": [ | |
| "language_model.model.layers.61.mlp.gate_proj", | |
| "language_model.model.layers.61.mlp.up_proj", | |
| "language_model.model.layers.61.mlp.down_proj" | |
| ], | |
| "candidates": [ | |
| { | |
| "dkld": -0.007963605970144283, | |
| "dbits": 2080899072 | |
| } | |
| ] | |
| } | |
| ], | |
| "base_kld": 0.4373273827135563, | |
| "arch_string": "Gemma3ForConditionalGeneration" | |
| } |