MNLP_M3_quantized_model / quant_log.csv
RangerX's picture
Upload folder using huggingface_hub
8dc01a0 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.0102534108,0.05000,0.499
0,self_attn.v_proj,0.0079884017,0.05000,0.270
0,self_attn.q_proj,0.0232020114,0.05000,0.277
0,self_attn.o_proj,0.0059849275,0.05000,0.541
0,mlp.gate_proj,0.2101839185,0.05000,0.273
0,mlp.up_proj,0.1052171737,0.05000,0.271
0,mlp.down_proj,0.0060404502,0.05000,1.081
1,self_attn.k_proj,0.0035987182,0.05000,0.270
1,self_attn.v_proj,0.0033963406,0.05000,0.271
1,self_attn.q_proj,0.0081585497,0.05000,0.268
1,self_attn.o_proj,0.0016202630,0.05000,0.530
1,mlp.gate_proj,1.3692135811,0.05000,0.272
1,mlp.up_proj,0.4010225534,0.05000,0.270
1,mlp.down_proj,0.0095159207,0.05000,0.812
2,self_attn.k_proj,0.0069046794,0.05000,0.268
2,self_attn.v_proj,0.0065494906,0.05000,0.274
2,self_attn.q_proj,0.0161531456,0.05000,0.267
2,self_attn.o_proj,0.0026321127,0.05000,0.539
2,mlp.gate_proj,0.9242770672,0.05000,0.269
2,mlp.up_proj,0.3328490257,0.05000,0.271
2,mlp.down_proj,12.6786127090,0.05000,0.812
3,self_attn.k_proj,0.0600524060,0.05000,0.267
3,self_attn.v_proj,0.0603904948,0.05000,0.270
3,self_attn.q_proj,0.1229075640,0.05000,0.266
3,self_attn.o_proj,0.0060743806,0.05000,0.533
3,mlp.gate_proj,1.1898157597,0.05000,0.269
3,mlp.up_proj,0.4574447274,0.05000,0.268
3,mlp.down_proj,0.0240235925,0.05000,0.809
4,self_attn.k_proj,0.0597024262,0.05000,0.269
4,self_attn.v_proj,0.0602943413,0.05000,0.266
4,self_attn.q_proj,0.1205628663,0.05000,0.268
4,self_attn.o_proj,0.0091588972,0.05000,0.532
4,mlp.gate_proj,1.0823590755,0.05000,0.274
4,mlp.up_proj,0.4695992768,0.05000,0.269
4,mlp.down_proj,0.0285880528,0.05000,0.810
5,self_attn.k_proj,0.0870025828,0.05000,0.268
5,self_attn.v_proj,0.0894146040,0.05000,0.270
5,self_attn.q_proj,0.2058143020,0.05000,0.267
5,self_attn.o_proj,0.0124091133,0.05000,0.540
5,mlp.gate_proj,0.7296952605,0.05000,0.269
5,mlp.up_proj,0.4307921827,0.05000,0.267
5,mlp.down_proj,0.0321102552,0.05000,0.815
6,self_attn.k_proj,0.0651639923,0.05000,0.270
6,self_attn.v_proj,0.0574318357,0.05000,0.271
6,self_attn.q_proj,0.1408478618,0.05000,0.284
6,self_attn.o_proj,0.0105036153,0.05000,0.559
6,mlp.gate_proj,0.8694056273,0.05000,0.277
6,mlp.up_proj,0.5381510854,0.05000,0.270
6,mlp.down_proj,0.0412271991,0.05000,0.817
7,self_attn.k_proj,0.1137319654,0.05000,0.272
7,self_attn.v_proj,0.1268429458,0.05000,0.269
7,self_attn.q_proj,0.2715810537,0.05000,0.270
7,self_attn.o_proj,0.0162299760,0.05000,0.572
7,mlp.gate_proj,0.9687359333,0.05000,0.274
7,mlp.up_proj,0.5892530084,0.05000,0.273
7,mlp.down_proj,0.0502672568,0.05000,0.836
8,self_attn.k_proj,0.1439509392,0.05000,0.272
8,self_attn.v_proj,0.1313253343,0.05000,0.268
8,self_attn.q_proj,0.3237347603,0.05000,0.270
8,self_attn.o_proj,0.0149488933,0.05000,0.542
8,mlp.gate_proj,0.9375967979,0.05000,0.271
8,mlp.up_proj,0.5916349888,0.05000,0.274
8,mlp.down_proj,0.0501379147,0.05000,0.821
9,self_attn.k_proj,0.2607176304,0.05000,0.270
9,self_attn.v_proj,0.2475461066,0.05000,0.272
9,self_attn.q_proj,0.6035818458,0.05000,0.269
9,self_attn.o_proj,0.0311477184,0.05000,0.538
9,mlp.gate_proj,1.0245599747,0.05000,0.271
9,mlp.up_proj,0.6295373440,0.05000,0.269
9,mlp.down_proj,0.0618912131,0.05000,0.818
10,self_attn.k_proj,0.2044563591,0.05000,0.271
10,self_attn.v_proj,0.2067638040,0.05000,0.275
10,self_attn.q_proj,0.4824802279,0.05000,0.270
10,self_attn.o_proj,0.0315365233,0.05000,0.539
10,mlp.gate_proj,1.0230076313,0.05000,0.276
10,mlp.up_proj,0.6350437403,0.05000,0.275
10,mlp.down_proj,0.0830124989,0.05000,0.831
11,self_attn.k_proj,0.3832934499,0.05000,0.272
11,self_attn.v_proj,0.3299685717,0.05000,0.273
11,self_attn.q_proj,0.9707468152,0.05000,0.276
11,self_attn.o_proj,0.0668854564,0.05000,0.537
11,mlp.gate_proj,0.7399315238,0.05000,0.274
11,mlp.up_proj,0.5590443611,0.05000,0.271
11,mlp.down_proj,0.0836513788,0.05000,0.824
12,self_attn.k_proj,0.3102838993,0.05000,0.268
12,self_attn.v_proj,0.3088186979,0.05000,0.272
12,self_attn.q_proj,0.8227573633,0.05000,0.515
12,self_attn.o_proj,0.0342148244,0.05000,0.536
12,mlp.gate_proj,0.6812306643,0.05000,0.273
12,mlp.up_proj,0.5542650223,0.05000,0.270
12,mlp.down_proj,0.0880227759,0.05000,0.816
13,self_attn.k_proj,0.3208425641,0.05000,0.271
13,self_attn.v_proj,0.3610678911,0.05000,0.271
13,self_attn.q_proj,0.9154192209,0.05000,0.271
13,self_attn.o_proj,0.0465078503,0.05000,0.541
13,mlp.gate_proj,0.7669239044,0.05000,0.274
13,mlp.up_proj,0.6116556525,0.05000,0.272
13,mlp.down_proj,0.0951566845,0.05000,0.815
14,self_attn.k_proj,0.4429032505,0.05000,0.270
14,self_attn.v_proj,0.4558904767,0.05000,0.269
14,self_attn.q_proj,1.1899302006,0.05000,0.271
14,self_attn.o_proj,0.0465852544,0.05000,0.539
14,mlp.gate_proj,0.7928631902,0.05000,0.273
14,mlp.up_proj,0.6356908083,0.05000,0.271
14,mlp.down_proj,0.1102237254,0.05000,0.813
15,self_attn.k_proj,0.7353894711,0.05000,0.269
15,self_attn.v_proj,0.8996654749,0.05000,0.275
15,self_attn.q_proj,2.2844204903,0.05000,0.277
15,self_attn.o_proj,0.0681514293,0.05000,0.546
15,mlp.gate_proj,0.9548274279,0.05000,0.271
15,mlp.up_proj,0.7745286226,0.05000,0.270
15,mlp.down_proj,0.1513546854,0.05000,0.809
16,self_attn.k_proj,1.0767021179,0.05000,0.271
16,self_attn.v_proj,0.9916024208,0.05000,0.275
16,self_attn.q_proj,3.0991945267,0.05000,0.275
16,self_attn.o_proj,0.0973514616,0.05000,0.542
16,mlp.gate_proj,1.0501160622,0.05000,0.270
16,mlp.up_proj,0.9404838085,0.05000,0.272
16,mlp.down_proj,0.3604103029,0.05000,0.813
17,self_attn.k_proj,2.4124805927,0.05000,0.273
17,self_attn.v_proj,2.8787002563,0.05000,0.270
17,self_attn.q_proj,7.4132294655,0.05000,0.271
17,self_attn.o_proj,0.2221524268,0.05000,0.544
17,mlp.gate_proj,1.6191822290,0.05000,0.272
17,mlp.up_proj,1.4351911545,0.05000,0.273
17,mlp.down_proj,0.4600560665,0.05000,0.816
18,self_attn.k_proj,2.4339659214,0.05000,0.270
18,self_attn.v_proj,2.6121122837,0.05000,0.272
18,self_attn.q_proj,7.7049455643,0.05000,0.267
18,self_attn.o_proj,0.1935115755,0.05000,0.535
18,mlp.gate_proj,2.0874688625,0.05000,0.271
18,mlp.up_proj,1.8297674656,0.05000,0.269
18,mlp.down_proj,0.8489264846,0.05000,0.810
19,self_attn.k_proj,4.2865271568,0.05000,0.267
19,self_attn.v_proj,5.3223285675,0.05000,0.266
19,self_attn.q_proj,14.3558692932,0.05000,0.268
19,self_attn.o_proj,0.3448703289,0.05000,0.536
19,mlp.gate_proj,2.2460441589,0.05000,0.267
19,mlp.up_proj,2.3563187122,0.05000,0.266
19,mlp.down_proj,1.4070756435,0.05000,0.814
20,self_attn.k_proj,6.4479541779,0.05000,0.268
20,self_attn.v_proj,7.3154568672,0.05000,0.267
20,self_attn.q_proj,19.4513092041,0.05000,0.269
20,self_attn.o_proj,0.4146451354,0.05000,0.535
20,mlp.gate_proj,2.5706572533,0.05000,0.270
20,mlp.up_proj,2.8989415169,0.05000,0.268
20,mlp.down_proj,1.9455537796,0.05000,0.809
21,self_attn.k_proj,11.4309139252,0.05000,0.270
21,self_attn.v_proj,13.4588928223,0.05000,0.269
21,self_attn.q_proj,33.1673202515,0.05000,0.271
21,self_attn.o_proj,0.6142717600,0.05000,0.536
21,mlp.gate_proj,3.0040376186,0.05000,0.269
21,mlp.up_proj,3.6499385834,0.05000,0.267
21,mlp.down_proj,2.9936137199,0.05000,0.810
22,self_attn.k_proj,13.1742839813,0.05000,0.267
22,self_attn.v_proj,17.1264152527,0.05000,0.267
22,self_attn.q_proj,37.4587974548,0.05000,0.268
22,self_attn.o_proj,0.8527563214,0.05000,0.533
22,mlp.gate_proj,3.4767191410,0.05000,0.271
22,mlp.up_proj,4.3843421936,0.05000,0.269
22,mlp.down_proj,3.9900336266,0.05000,0.848
23,self_attn.k_proj,17.5688858032,0.05000,0.267
23,self_attn.v_proj,20.2590312958,0.05000,0.267
23,self_attn.q_proj,42.3259162903,0.05000,0.270
23,self_attn.o_proj,0.9686302543,0.05000,0.533
23,mlp.gate_proj,3.8405270576,0.05000,0.273
23,mlp.up_proj,5.0237965584,0.05000,0.269
23,mlp.down_proj,4.2359795570,0.05000,1.067
24,self_attn.k_proj,28.6652069092,0.05000,0.271
24,self_attn.v_proj,31.3004150391,0.05000,0.266
24,self_attn.q_proj,80.2267913818,0.05000,0.268
24,self_attn.o_proj,1.1186426878,0.05000,0.541
24,mlp.gate_proj,3.6467981339,0.05000,0.271
24,mlp.up_proj,4.9967317581,0.05000,0.269
24,mlp.down_proj,5.0153646469,0.05000,0.818
25,self_attn.k_proj,34.1952438354,0.05000,0.268
25,self_attn.v_proj,52.2172927856,0.05000,0.268
25,self_attn.q_proj,102.7100524902,0.05000,0.267
25,self_attn.o_proj,1.4557044506,0.05000,0.544
25,mlp.gate_proj,3.5655152798,0.05000,0.271
25,mlp.up_proj,5.1156783104,0.05000,0.266
25,mlp.down_proj,6.0685262680,0.05000,0.818
26,self_attn.k_proj,33.4326934814,0.05000,0.270
26,self_attn.v_proj,48.4014549255,0.05000,0.269
26,self_attn.q_proj,111.4053268433,0.05000,0.270
26,self_attn.o_proj,3.3541142941,0.05000,0.532
26,mlp.gate_proj,3.8577950001,0.05000,0.269
26,mlp.up_proj,5.3475961685,0.05000,0.267
26,mlp.down_proj,11.5380468369,0.05000,0.810
27,self_attn.k_proj,31.9528331757,0.05000,0.270
27,self_attn.v_proj,38.4808578491,0.05000,0.272
27,self_attn.q_proj,70.9194641113,0.05000,0.268
27,self_attn.o_proj,2.9374377728,0.05000,0.532
27,mlp.gate_proj,17.0734329224,0.05000,0.267
27,mlp.up_proj,17.2442932129,0.05000,0.266
27,mlp.down_proj,24.1500759125,0.05000,0.809