Qwen3.6-27B-GPTQ-Int4 / quant_log.csv
palmfuture's picture
Initial release: GPTQ Int4 uniform g32 + MTP
bfc56ac verified
layer,module,loss,damp,time
0,linear_attn.in_proj_qkv,0.0003197445,0.05000,2.228
0,linear_attn.in_proj_z,0.0002064770,0.05000,2.027
0,linear_attn.out_proj,0.0000001519,0.05000,2.319
0,mlp.up_proj,0.0000019669,0.05000,2.673
0,mlp.gate_proj,0.0000021337,0.05000,2.799
0,mlp.down_proj,0.0000000202,0.05000,9.369
1,linear_attn.in_proj_qkv,0.0000158468,0.05000,1.846
1,linear_attn.in_proj_z,0.0000097547,0.05000,1.875
1,linear_attn.out_proj,0.0000000610,0.05000,2.394
1,mlp.up_proj,0.0000043260,0.05000,2.832
1,mlp.gate_proj,0.0000045451,0.05000,2.806
1,mlp.down_proj,0.0000000292,0.05000,9.841
2,linear_attn.in_proj_qkv,0.0000236378,0.05000,1.961
2,linear_attn.in_proj_z,0.0000143486,0.05000,1.805
2,linear_attn.out_proj,0.0000000818,0.05000,2.354
2,mlp.gate_proj,0.0000083266,0.05000,2.744
2,mlp.up_proj,0.0000078148,0.05000,2.820
2,mlp.down_proj,0.0000001103,0.05000,9.239
3,self_attn.k_proj,0.0000168175,0.05000,3.962
3,self_attn.v_proj,0.0000166043,0.05000,4.016
3,self_attn.q_proj,0.0002342821,0.05000,4.118
3,self_attn.o_proj,0.0000000840,0.05000,2.620
3,mlp.gate_proj,0.0000101265,0.05000,2.768
3,mlp.up_proj,0.0000097521,0.05000,2.807
3,mlp.down_proj,0.0000000773,0.05000,9.705
4,linear_attn.in_proj_qkv,0.0000327987,0.05000,2.108
4,linear_attn.in_proj_z,0.0000209418,0.05000,1.814
4,linear_attn.out_proj,0.0000001242,0.05000,2.427
4,mlp.gate_proj,0.0000135747,0.05000,2.789
4,mlp.up_proj,0.0000131227,0.05000,2.835
4,mlp.down_proj,0.0000001075,0.05000,9.531
5,linear_attn.in_proj_qkv,0.0000415633,0.05000,1.970
5,linear_attn.in_proj_z,0.0000271475,0.05000,1.920
5,linear_attn.out_proj,0.0000001655,0.05000,2.505
5,mlp.gate_proj,0.0000173205,0.05000,2.811
5,mlp.up_proj,0.0000162889,0.05000,2.830
5,mlp.down_proj,0.0000001692,0.05000,9.587
6,linear_attn.in_proj_qkv,0.0000621110,0.05000,2.009
6,linear_attn.in_proj_z,0.0000372702,0.05000,1.874
6,linear_attn.out_proj,0.0000002171,0.05000,2.481
6,mlp.up_proj,0.0000213310,0.05000,2.764
6,mlp.gate_proj,0.0000229309,0.05000,3.045
6,mlp.down_proj,0.0000002675,0.05000,9.538
7,self_attn.v_proj,0.0000145466,0.05000,3.755
7,self_attn.k_proj,0.0000158137,0.05000,3.900
7,self_attn.q_proj,0.0002015561,0.05000,4.001
7,self_attn.o_proj,0.0000001460,0.05000,2.417
7,mlp.gate_proj,0.0000258102,0.05000,2.853
7,mlp.up_proj,0.0000240012,0.05000,3.144
7,mlp.down_proj,0.0000003147,0.05000,9.532
8,linear_attn.in_proj_qkv,0.0000642539,0.05000,1.999
8,linear_attn.in_proj_z,0.0000405329,0.05000,1.941
8,linear_attn.out_proj,0.0000003066,0.05000,2.422
8,mlp.up_proj,0.0000270153,0.05000,2.813
8,mlp.gate_proj,0.0000288301,0.05000,2.838
8,mlp.down_proj,0.0000003754,0.05000,9.611
9,linear_attn.in_proj_qkv,0.0000657042,0.05000,1.955
9,linear_attn.in_proj_z,0.0000400837,0.05000,1.924
9,linear_attn.out_proj,0.0000003402,0.05000,2.335
9,mlp.up_proj,0.0000296260,0.05000,2.857
9,mlp.gate_proj,0.0000313970,0.05000,2.860
9,mlp.down_proj,0.0000004274,0.05000,9.500
10,linear_attn.in_proj_qkv,0.0000685984,0.05000,2.139
10,linear_attn.in_proj_z,0.0000406228,0.05000,2.094
10,linear_attn.out_proj,0.0000003843,0.05000,2.428
10,mlp.gate_proj,0.0000321583,0.05000,2.752
10,mlp.up_proj,0.0000305340,0.05000,2.788
10,mlp.down_proj,0.0000004743,0.05000,9.580
11,self_attn.k_proj,0.0000151571,0.05000,3.848
11,self_attn.v_proj,0.0000136842,0.05000,3.913
11,self_attn.q_proj,0.0001796321,0.05000,3.993
11,self_attn.o_proj,0.0000002628,0.05000,2.350
11,mlp.gate_proj,0.0000343429,0.05000,2.815
11,mlp.up_proj,0.0000327367,0.05000,2.870
11,mlp.down_proj,0.0000005578,0.05000,9.701
12,linear_attn.in_proj_qkv,0.0000775487,0.05000,1.976
12,linear_attn.in_proj_z,0.0000459151,0.05000,1.951
12,linear_attn.out_proj,0.0000005732,0.05000,2.360
12,mlp.gate_proj,0.0000356221,0.05000,2.867
12,mlp.up_proj,0.0000339428,0.05000,2.894
12,mlp.down_proj,0.0000006371,0.05000,9.814
13,linear_attn.in_proj_qkv,0.0000816816,0.05000,2.078
13,linear_attn.in_proj_z,0.0000461836,0.05000,2.012
13,linear_attn.out_proj,0.0000006304,0.05000,2.461
13,mlp.up_proj,0.0000364391,0.05000,2.754
13,mlp.gate_proj,0.0000382620,0.05000,3.088
13,mlp.down_proj,0.0000007334,0.05000,9.365
14,linear_attn.in_proj_qkv,0.0000896298,0.05000,1.918
14,linear_attn.in_proj_z,0.0000520888,0.05000,1.939
14,linear_attn.out_proj,0.0000007492,0.05000,2.463
14,mlp.up_proj,0.0000385812,0.05000,2.837
14,mlp.gate_proj,0.0000403974,0.05000,2.985
14,mlp.down_proj,0.0000008201,0.05000,9.448
15,self_attn.v_proj,0.0000131611,0.05000,3.857
15,self_attn.k_proj,0.0000135512,0.05000,3.920
15,self_attn.q_proj,0.0001546285,0.05000,4.023
15,self_attn.o_proj,0.0000004657,0.05000,2.425
15,mlp.gate_proj,0.0000461728,0.05000,2.800
15,mlp.up_proj,0.0000445283,0.05000,2.873
15,mlp.down_proj,0.0000009885,0.05000,9.419
16,linear_attn.in_proj_qkv,0.0000963353,0.05000,2.028
16,linear_attn.in_proj_z,0.0000548140,0.05000,2.275
16,linear_attn.out_proj,0.0000008343,0.05000,2.233
16,mlp.gate_proj,0.0000508629,0.05000,2.775
16,mlp.up_proj,0.0000487897,0.05000,2.822
16,mlp.down_proj,0.0000011787,0.05000,9.420
17,linear_attn.in_proj_qkv,0.0001095097,0.05000,2.049
17,linear_attn.in_proj_z,0.0000560735,0.05000,2.012
17,linear_attn.out_proj,0.0000011213,0.05000,2.254
17,mlp.gate_proj,0.0000583781,0.05000,2.725
17,mlp.up_proj,0.0000559772,0.05000,2.836
17,mlp.down_proj,0.0000015447,0.05000,9.683
18,linear_attn.in_proj_qkv,0.0001184729,0.05000,2.019
18,linear_attn.in_proj_z,0.0000651775,0.05000,1.983
18,linear_attn.out_proj,0.0000013323,0.05000,2.491
18,mlp.gate_proj,0.0000716857,0.05000,2.830
18,mlp.up_proj,0.0000672247,0.05000,2.852
18,mlp.down_proj,0.0000024226,0.05000,9.683
19,self_attn.k_proj,0.0000173523,0.05000,3.986
19,self_attn.v_proj,0.0000194091,0.05000,4.015
19,self_attn.q_proj,0.0001928319,0.05000,4.043
19,self_attn.o_proj,0.0000018063,0.05000,2.361
19,mlp.gate_proj,0.0000900986,0.05000,2.658
19,mlp.up_proj,0.0000849859,0.05000,2.772
19,mlp.down_proj,0.0000033498,0.05000,9.764
20,linear_attn.in_proj_qkv,0.0002139989,0.05000,2.011
20,linear_attn.in_proj_z,0.0001198187,0.05000,1.909
20,linear_attn.out_proj,0.0000021942,0.05000,2.544
20,mlp.gate_proj,0.0001100951,0.05000,2.911
20,mlp.up_proj,0.0001016944,0.05000,2.926
20,mlp.down_proj,0.0000038367,0.05000,9.316
21,linear_attn.in_proj_qkv,0.0002620370,0.05000,2.017
21,linear_attn.in_proj_z,0.0001673315,0.05000,1.818
21,linear_attn.out_proj,0.0000027516,0.05000,2.425
21,mlp.up_proj,0.0001115360,0.05000,2.836
21,mlp.gate_proj,0.0001198745,0.05000,2.846
21,mlp.down_proj,0.0000041294,0.05000,9.817
22,linear_attn.in_proj_qkv,0.0002282727,0.05000,2.019
22,linear_attn.in_proj_z,0.0001399470,0.05000,1.863
22,linear_attn.out_proj,0.0000025874,0.05000,2.483
22,mlp.up_proj,0.0001239583,0.05000,2.856
22,mlp.gate_proj,0.0001402319,0.05000,2.877
22,mlp.down_proj,0.0000046557,0.05000,9.638
23,self_attn.k_proj,0.0000247198,0.05000,3.962
23,self_attn.v_proj,0.0000262281,0.05000,3.982
23,self_attn.q_proj,0.0002511130,0.05000,4.052
23,self_attn.o_proj,0.0000022185,0.05000,2.408
23,mlp.up_proj,0.0001334481,0.05000,2.686
23,mlp.gate_proj,0.0001454333,0.05000,2.801
23,mlp.down_proj,0.0000048433,0.05000,9.444
24,linear_attn.in_proj_qkv,0.0002210956,0.05000,1.948
24,linear_attn.in_proj_z,0.0001247617,0.05000,1.858
24,linear_attn.out_proj,0.0000031194,0.05000,2.483
24,mlp.up_proj,0.0001440041,0.05000,2.787
24,mlp.gate_proj,0.0001577180,0.05000,2.968
24,mlp.down_proj,0.0000056242,0.05000,9.495
25,linear_attn.in_proj_qkv,0.0002246287,0.05000,2.023
25,linear_attn.in_proj_z,0.0001186763,0.05000,1.911
25,linear_attn.out_proj,0.0000031973,0.05000,2.360
25,mlp.up_proj,0.0001451803,0.05000,2.870
25,mlp.gate_proj,0.0001504104,0.05000,2.889
25,mlp.down_proj,0.0000056412,0.05000,9.788
26,linear_attn.in_proj_qkv,0.0002032605,0.05000,2.094
26,linear_attn.in_proj_z,0.0001032550,0.05000,1.979
26,linear_attn.out_proj,0.0000033678,0.05000,2.544
26,mlp.gate_proj,0.0001398861,0.05000,2.824
26,mlp.up_proj,0.0001431139,0.05000,2.828
26,mlp.down_proj,0.0000059178,0.05000,9.702
27,self_attn.v_proj,0.0000209463,0.05000,3.962
27,self_attn.k_proj,0.0000228403,0.05000,4.013
27,self_attn.q_proj,0.0002288074,0.05000,4.068
27,self_attn.o_proj,0.0000044184,0.05000,2.295
27,mlp.up_proj,0.0001511458,0.05000,2.871
27,mlp.gate_proj,0.0001433983,0.05000,2.919
27,mlp.down_proj,0.0000063376,0.05000,9.524
28,linear_attn.in_proj_qkv,0.0001990004,0.05000,2.131
28,linear_attn.in_proj_z,0.0000942670,0.05000,1.998
28,linear_attn.out_proj,0.0000041844,0.05000,2.418
28,mlp.up_proj,0.0001480044,0.05000,2.869
28,mlp.gate_proj,0.0001377359,0.05000,2.896
28,mlp.down_proj,0.0000064281,0.05000,9.705
29,linear_attn.in_proj_qkv,0.0002153540,0.05000,1.966
29,linear_attn.in_proj_z,0.0001002709,0.05000,2.028
29,linear_attn.out_proj,0.0000037770,0.05000,2.416
29,mlp.up_proj,0.0001485866,0.05000,2.798
29,mlp.gate_proj,0.0001374452,0.05000,3.063
29,mlp.down_proj,0.0000064556,0.05000,9.480
30,linear_attn.in_proj_qkv,0.0002151987,0.05000,1.994
30,linear_attn.in_proj_z,0.0001021870,0.05000,1.998
30,linear_attn.out_proj,0.0000047097,0.05000,2.726
30,mlp.gate_proj,0.0001347883,0.05000,2.856
30,mlp.up_proj,0.0001493319,0.05000,2.911
30,mlp.down_proj,0.0000066001,0.05000,9.961
31,self_attn.k_proj,0.0000226690,0.05000,3.858
31,self_attn.v_proj,0.0000261192,0.05000,3.924
31,self_attn.q_proj,0.0002197505,0.05000,4.045
31,self_attn.o_proj,0.0000056364,0.05000,2.382
31,mlp.up_proj,0.0001621095,0.05000,2.591
31,mlp.gate_proj,0.0001435794,0.05000,2.934
31,mlp.down_proj,0.0000072634,0.05000,9.668
32,linear_attn.in_proj_qkv,0.0002293290,0.05000,1.991
32,linear_attn.in_proj_z,0.0001018995,0.05000,1.925
32,linear_attn.out_proj,0.0000049107,0.05000,2.322
32,mlp.up_proj,0.0001718162,0.05000,2.772
32,mlp.gate_proj,0.0001514548,0.05000,2.775
32,mlp.down_proj,0.0000077587,0.05000,9.593
33,linear_attn.in_proj_qkv,0.0002702387,0.05000,1.989
33,linear_attn.in_proj_z,0.0001137513,0.05000,2.022
33,linear_attn.out_proj,0.0000057096,0.05000,2.358
33,mlp.gate_proj,0.0001562763,0.05000,2.871
33,mlp.up_proj,0.0001783576,0.05000,2.878
33,mlp.down_proj,0.0000078964,0.05000,9.727
34,linear_attn.in_proj_qkv,0.0002623729,0.05000,2.051
34,linear_attn.in_proj_z,0.0001201794,0.05000,2.045
34,linear_attn.out_proj,0.0000058287,0.05000,2.418
34,mlp.gate_proj,0.0001680708,0.05000,2.780
34,mlp.up_proj,0.0001894957,0.05000,2.798
34,mlp.down_proj,0.0000102192,0.05000,9.354
35,self_attn.k_proj,0.0000276489,0.05000,3.962
35,self_attn.v_proj,0.0000388686,0.05000,3.962
35,self_attn.q_proj,0.0002702927,0.05000,3.983
35,self_attn.o_proj,0.0000094047,0.05000,2.309
35,mlp.gate_proj,0.0001789629,0.05000,2.753
35,mlp.up_proj,0.0001953928,0.05000,2.763
35,mlp.down_proj,0.0000115370,0.05000,9.672
36,linear_attn.in_proj_qkv,0.0003655588,0.05000,2.060
36,linear_attn.in_proj_z,0.0001855907,0.05000,1.984
36,linear_attn.out_proj,0.0000057162,0.05000,2.465
36,mlp.up_proj,0.0001925602,0.05000,2.874
36,mlp.gate_proj,0.0001991262,0.05000,2.885
36,mlp.down_proj,0.0000104420,0.05000,9.674
37,linear_attn.in_proj_qkv,0.0003918287,0.05000,1.928
37,linear_attn.in_proj_z,0.0002275343,0.05000,2.004
37,linear_attn.out_proj,0.0000059617,0.05000,2.311
37,mlp.gate_proj,0.0002017582,0.05000,2.795
37,mlp.up_proj,0.0001917516,0.05000,2.853
37,mlp.down_proj,0.0000098027,0.05000,9.710
38,linear_attn.in_proj_qkv,0.0003525520,0.05000,2.006
38,linear_attn.in_proj_z,0.0002091738,0.05000,1.879
38,linear_attn.out_proj,0.0000046830,0.05000,2.345
38,mlp.gate_proj,0.0002641791,0.05000,2.838
38,mlp.up_proj,0.0002142234,0.05000,3.150
38,mlp.down_proj,0.0000099394,0.05000,9.727
39,self_attn.v_proj,0.0000394056,0.05000,4.145
39,self_attn.k_proj,0.0000318873,0.05000,4.213
39,self_attn.q_proj,0.0003112402,0.05000,4.256
39,self_attn.o_proj,0.0000060011,0.05000,2.287
39,mlp.gate_proj,0.0002393658,0.05000,2.810
39,mlp.up_proj,0.0002080120,0.05000,2.840
39,mlp.down_proj,0.0000092458,0.05000,9.717
40,linear_attn.in_proj_qkv,0.0003310422,0.05000,2.307
40,linear_attn.in_proj_z,0.0001864410,0.05000,1.976
40,linear_attn.out_proj,0.0000053041,0.05000,2.429
40,mlp.up_proj,0.0002204887,0.05000,2.837
40,mlp.gate_proj,0.0002607984,0.05000,2.884
40,mlp.down_proj,0.0000098098,0.05000,9.740
41,linear_attn.in_proj_qkv,0.0003050378,0.05000,1.945
41,linear_attn.in_proj_z,0.0001696298,0.05000,1.996
41,linear_attn.out_proj,0.0000046962,0.05000,2.688
41,mlp.up_proj,0.0002130802,0.05000,2.855
41,mlp.gate_proj,0.0002247281,0.05000,2.862
41,mlp.down_proj,0.0000096282,0.05000,9.423
42,linear_attn.in_proj_qkv,0.0002849892,0.05000,2.075
42,linear_attn.in_proj_z,0.0001530167,0.05000,1.877
42,linear_attn.out_proj,0.0000052826,0.05000,2.569
42,mlp.gate_proj,0.0002039032,0.05000,2.780
42,mlp.up_proj,0.0002093354,0.05000,2.879
42,mlp.down_proj,0.0000104336,0.05000,9.630
43,self_attn.k_proj,0.0000311214,0.05000,3.924
43,self_attn.v_proj,0.0000381165,0.05000,4.046
43,self_attn.q_proj,0.0002958142,0.05000,4.107
43,self_attn.o_proj,0.0000087401,0.05000,2.359
43,mlp.up_proj,0.0002176778,0.05000,2.853
43,mlp.gate_proj,0.0002034712,0.05000,2.874
43,mlp.down_proj,0.0000114969,0.05000,10.142
44,linear_attn.in_proj_qkv,0.0002739369,0.05000,2.060
44,linear_attn.in_proj_z,0.0001355589,0.05000,1.968
44,linear_attn.out_proj,0.0000074509,0.05000,2.427
44,mlp.up_proj,0.0002208027,0.05000,2.832
44,mlp.gate_proj,0.0002033508,0.05000,2.878
44,mlp.down_proj,0.0000129796,0.05000,9.866
45,linear_attn.in_proj_qkv,0.0002792265,0.05000,2.067
45,linear_attn.in_proj_z,0.0001384729,0.05000,2.072
45,linear_attn.out_proj,0.0000065496,0.05000,2.394
45,mlp.up_proj,0.0002234423,0.05000,2.918
45,mlp.gate_proj,0.0002046250,0.05000,2.939
45,mlp.down_proj,0.0000134076,0.05000,9.396
46,linear_attn.in_proj_qkv,0.0002909530,0.05000,2.012
46,linear_attn.in_proj_z,0.0001456825,0.05000,2.002
46,linear_attn.out_proj,0.0000095057,0.05000,2.464
46,mlp.gate_proj,0.0002010068,0.05000,2.793
46,mlp.up_proj,0.0002256891,0.05000,2.816
46,mlp.down_proj,0.0000143541,0.05000,9.666
47,self_attn.v_proj,0.0000506427,0.05000,3.942
47,self_attn.q_proj,0.0003168942,0.05000,4.071
47,self_attn.k_proj,0.0000321328,0.05000,4.077
47,self_attn.o_proj,0.0000101120,0.05000,2.398
47,mlp.gate_proj,0.0002227599,0.05000,2.660
47,mlp.up_proj,0.0002490375,0.05000,2.815
47,mlp.down_proj,0.0000175623,0.05000,9.421
48,linear_attn.in_proj_qkv,0.0003186905,0.05000,1.999
48,linear_attn.in_proj_z,0.0001540790,0.05000,1.970
48,linear_attn.out_proj,0.0000110738,0.05000,2.431
48,mlp.gate_proj,0.0002386876,0.05000,2.867
48,mlp.up_proj,0.0002675655,0.05000,2.881
48,mlp.down_proj,0.0000212672,0.05000,9.621
49,linear_attn.in_proj_qkv,0.0003820718,0.05000,2.009
49,linear_attn.in_proj_z,0.0001642076,0.05000,1.910
49,linear_attn.out_proj,0.0000149738,0.05000,2.275
49,mlp.gate_proj,0.0002584349,0.05000,2.741
49,mlp.up_proj,0.0002866655,0.05000,2.790
49,mlp.down_proj,0.0000272903,0.05000,9.620
50,linear_attn.in_proj_qkv,0.0003893767,0.05000,2.039
50,linear_attn.in_proj_z,0.0001826149,0.05000,1.886
50,linear_attn.out_proj,0.0000220006,0.05000,2.407
50,mlp.up_proj,0.0003265009,0.05000,2.806
50,mlp.gate_proj,0.0003083456,0.05000,2.852
50,mlp.down_proj,0.0000455937,0.05000,9.704
51,self_attn.k_proj,0.0000418068,0.05000,3.974
51,self_attn.q_proj,0.0004121897,0.05000,4.004
51,self_attn.v_proj,0.0000925749,0.05000,4.031
51,self_attn.o_proj,0.0000293543,0.05000,2.477
51,mlp.gate_proj,0.0003434407,0.05000,2.824
51,mlp.up_proj,0.0003731706,0.05000,2.881
51,mlp.down_proj,0.0000584166,0.05000,9.791
52,linear_attn.in_proj_qkv,0.0005982841,0.05000,2.058
52,linear_attn.in_proj_z,0.0002757637,0.05000,2.004
52,linear_attn.out_proj,0.0000300584,0.05000,2.357
52,mlp.gate_proj,0.0004216733,0.05000,2.768
52,mlp.up_proj,0.0004031492,0.05000,3.058
52,mlp.down_proj,0.0000588965,0.05000,9.417
53,linear_attn.in_proj_qkv,0.0005947312,0.05000,1.999
53,linear_attn.in_proj_z,0.0002927151,0.05000,2.049
53,linear_attn.out_proj,0.0000332334,0.05000,2.384
53,mlp.up_proj,0.0004268191,0.05000,2.878
53,mlp.gate_proj,0.0004694973,0.05000,2.915
53,mlp.down_proj,0.0000641496,0.05000,9.748
54,linear_attn.in_proj_qkv,0.0005754633,0.05000,2.075
54,linear_attn.in_proj_z,0.0003124722,0.05000,1.922
54,linear_attn.out_proj,0.0000333667,0.05000,2.403
54,mlp.up_proj,0.0005059157,0.05000,2.791
54,mlp.gate_proj,0.0005929848,0.05000,2.831
54,mlp.down_proj,0.0000913851,0.05000,9.517
55,self_attn.q_proj,0.0005465929,0.05000,3.951
55,self_attn.v_proj,0.0001239293,0.05000,3.981
55,self_attn.k_proj,0.0000579751,0.05000,4.000
55,self_attn.o_proj,0.0000298551,0.05000,2.327
55,mlp.gate_proj,0.0005700416,0.05000,2.823
55,mlp.up_proj,0.0005092237,0.05000,2.834
55,mlp.down_proj,0.0000769449,0.05000,9.598
56,linear_attn.in_proj_qkv,0.0006624743,0.05000,1.882
56,linear_attn.in_proj_z,0.0003330500,0.05000,1.871
56,linear_attn.out_proj,0.0000457990,0.05000,2.365
56,mlp.gate_proj,0.0006302628,0.05000,2.915
56,mlp.up_proj,0.0005478271,0.05000,3.194
56,mlp.down_proj,0.0000767774,0.05000,9.813
57,linear_attn.in_proj_qkv,0.0007052206,0.05000,2.025
57,linear_attn.in_proj_z,0.0003543249,0.05000,2.000
57,linear_attn.out_proj,0.0000407313,0.05000,2.426
57,mlp.up_proj,0.0006268600,0.05000,2.788
57,mlp.gate_proj,0.0007333108,0.05000,2.868
57,mlp.down_proj,0.0000806746,0.05000,9.734
58,linear_attn.in_proj_qkv,0.0006764381,0.05000,2.249
58,linear_attn.in_proj_z,0.0003702752,0.05000,1.827
58,linear_attn.out_proj,0.0000439231,0.05000,2.325
58,mlp.up_proj,0.0007224930,0.05000,2.771
58,mlp.gate_proj,0.0008458127,0.05000,2.851
58,mlp.down_proj,0.0001073471,0.05000,9.706
59,self_attn.v_proj,0.0002534219,0.05000,3.880
59,self_attn.k_proj,0.0000720708,0.05000,3.934
59,self_attn.q_proj,0.0006471389,0.05000,4.061
59,self_attn.o_proj,0.0000865519,0.05000,2.479
59,mlp.up_proj,0.0007308760,0.05000,2.750
59,mlp.gate_proj,0.0008335251,0.05000,2.801
59,mlp.down_proj,0.0001261923,0.05000,9.394
60,linear_attn.in_proj_qkv,0.0008105025,0.05000,2.106
60,linear_attn.in_proj_z,0.0003880060,0.05000,2.010
60,linear_attn.out_proj,0.0001007381,0.05000,2.189
60,mlp.gate_proj,0.0008283832,0.05000,2.740
60,mlp.up_proj,0.0007406551,0.05000,2.780
60,mlp.down_proj,0.0001567032,0.05000,9.783
61,linear_attn.in_proj_qkv,0.0006010910,0.05000,1.947
61,linear_attn.in_proj_z,0.0003464860,0.05000,1.794
61,linear_attn.out_proj,0.0000901399,0.05000,2.424
61,mlp.up_proj,0.0007882093,0.05000,2.968
61,mlp.gate_proj,0.0008725039,0.05000,2.987
61,mlp.down_proj,0.0002059536,0.05000,9.399
62,linear_attn.in_proj_qkv,0.0006572308,0.05000,2.043
62,linear_attn.in_proj_z,0.0003461558,0.05000,2.032
62,linear_attn.out_proj,0.0002392242,0.05000,2.488
62,mlp.up_proj,0.0007274505,0.05000,2.755
62,mlp.gate_proj,0.0008007132,0.05000,2.820
62,mlp.down_proj,0.0003095795,0.05000,9.611
63,self_attn.v_proj,0.0002023079,0.05000,3.974
63,self_attn.k_proj,0.0000646610,0.05000,3.993
63,self_attn.q_proj,0.0005759815,0.05000,4.071
63,self_attn.o_proj,0.0002338829,0.05000,2.411
63,mlp.gate_proj,0.0006730167,0.05000,2.771
63,mlp.up_proj,0.0005922088,0.05000,2.782
63,mlp.down_proj,0.0006151453,0.05000,9.336