Mistral-7b-V3-IT-code-0.5 / quant_log.csv
Devbora29's picture
Upload folder using huggingface_hub
3c2ef8e verified
Raw
History Blame Contribute Delete
10.4 kB
layer,module,loss,damp,time
0,self_attn.v_proj,0.0000000004,0.05000,4.879
0,self_attn.q_proj,0.0000000150,0.05000,4.920
0,self_attn.k_proj,0.0000000045,0.05000,4.920
0,self_attn.o_proj,0.0000000000,0.05000,1.541
0,mlp.up_proj,0.0000000142,0.05000,2.767
0,mlp.gate_proj,0.0000000164,0.05000,2.788
0,mlp.down_proj,0.0000000000,0.05000,5.935
1,self_attn.q_proj,0.0000000452,0.05000,5.686
1,self_attn.k_proj,0.0000000208,0.05000,5.717
1,self_attn.v_proj,0.0000000034,0.05000,5.753
1,self_attn.o_proj,0.0000000000,0.05000,1.558
1,mlp.gate_proj,0.0000000548,0.05000,2.780
1,mlp.up_proj,0.0000000480,0.05000,2.812
1,mlp.down_proj,0.0000000073,0.05000,5.981
2,self_attn.q_proj,0.0000003553,0.05000,5.404
2,self_attn.v_proj,0.0000000225,0.05000,5.422
2,self_attn.k_proj,0.0000001725,0.05000,5.441
2,self_attn.o_proj,0.0000000000,0.05000,1.573
2,mlp.gate_proj,0.0000001153,0.05000,2.787
2,mlp.up_proj,0.0000001006,0.05000,2.788
2,mlp.down_proj,0.0000000000,0.05000,5.971
3,self_attn.k_proj,0.0000000937,0.05000,5.724
3,self_attn.v_proj,0.0000000155,0.05000,5.736
3,self_attn.q_proj,0.0000001928,0.05000,5.763
3,self_attn.o_proj,0.0000000000,0.05000,1.568
3,mlp.up_proj,0.0000001660,0.05000,2.751
3,mlp.gate_proj,0.0000001922,0.05000,2.756
3,mlp.down_proj,0.0000000001,0.05000,6.016
4,self_attn.q_proj,0.0000003002,0.05000,5.606
4,self_attn.k_proj,0.0000001324,0.05000,5.636
4,self_attn.v_proj,0.0000000261,0.05000,5.673
4,self_attn.o_proj,0.0000000000,0.05000,1.554
4,mlp.gate_proj,0.0000002774,0.05000,2.768
4,mlp.up_proj,0.0000002246,0.05000,2.775
4,mlp.down_proj,0.0000000001,0.05000,6.006
5,self_attn.q_proj,0.0000003899,0.05000,5.595
5,self_attn.v_proj,0.0000000291,0.05000,5.614
5,self_attn.k_proj,0.0000001730,0.05000,5.617
5,self_attn.o_proj,0.0000000001,0.05000,1.574
5,mlp.gate_proj,0.0000003836,0.05000,2.772
5,mlp.up_proj,0.0000002912,0.05000,2.784
5,mlp.down_proj,0.0000000003,0.05000,6.005
6,self_attn.k_proj,0.0000001706,0.05000,5.528
6,self_attn.v_proj,0.0000000294,0.05000,5.586
6,self_attn.q_proj,0.0000003636,0.05000,5.630
6,self_attn.o_proj,0.0000000001,0.05000,1.573
6,mlp.gate_proj,0.0000004451,0.05000,2.861
6,mlp.up_proj,0.0000003460,0.05000,2.881
6,mlp.down_proj,0.0000000004,0.05000,6.009
7,self_attn.v_proj,0.0000000391,0.05000,5.708
7,self_attn.k_proj,0.0000002152,0.05000,5.739
7,self_attn.q_proj,0.0000004503,0.05000,5.761
7,self_attn.o_proj,0.0000000001,0.05000,1.558
7,mlp.up_proj,0.0000004005,0.05000,2.803
7,mlp.gate_proj,0.0000005274,0.05000,2.822
7,mlp.down_proj,0.0000000005,0.05000,6.020
8,self_attn.v_proj,0.0000000364,0.05000,5.675
8,self_attn.k_proj,0.0000001697,0.05000,5.686
8,self_attn.q_proj,0.0000003730,0.05000,5.700
8,self_attn.o_proj,0.0000000002,0.05000,1.551
8,mlp.gate_proj,0.0000005689,0.05000,2.796
8,mlp.up_proj,0.0000004404,0.05000,2.803
8,mlp.down_proj,0.0000000005,0.05000,5.992
9,self_attn.v_proj,0.0000000435,0.05000,5.665
9,self_attn.q_proj,0.0000005147,0.05000,5.700
9,self_attn.k_proj,0.0000002410,0.05000,5.705
9,self_attn.o_proj,0.0000000002,0.05000,1.557
9,mlp.gate_proj,0.0000005988,0.05000,2.784
9,mlp.up_proj,0.0000004793,0.05000,2.792
9,mlp.down_proj,0.0000000007,0.05000,5.989
10,self_attn.q_proj,0.0000004548,0.05000,5.268
10,self_attn.v_proj,0.0000000379,0.05000,5.291
10,self_attn.k_proj,0.0000002164,0.05000,5.309
10,self_attn.o_proj,0.0000000003,0.05000,1.565
10,mlp.up_proj,0.0000005106,0.05000,2.780
10,mlp.gate_proj,0.0000006227,0.05000,2.789
10,mlp.down_proj,0.0000000008,0.05000,5.958
11,self_attn.v_proj,0.0000000559,0.05000,5.584
11,self_attn.k_proj,0.0000002533,0.05000,5.600
11,self_attn.q_proj,0.0000005502,0.05000,5.626
11,self_attn.o_proj,0.0000000004,0.05000,1.522
11,mlp.up_proj,0.0000005648,0.05000,2.815
11,mlp.gate_proj,0.0000006790,0.05000,2.825
11,mlp.down_proj,0.0000000009,0.05000,6.012
12,self_attn.q_proj,0.0000007278,0.05000,5.495
12,self_attn.v_proj,0.0000000635,0.05000,5.547
12,self_attn.k_proj,0.0000003287,0.05000,5.564
12,self_attn.o_proj,0.0000000004,0.05000,1.548
12,mlp.up_proj,0.0000006364,0.05000,2.785
12,mlp.gate_proj,0.0000007479,0.05000,2.796
12,mlp.down_proj,0.0000000011,0.05000,5.937
13,self_attn.q_proj,0.0000005740,0.05000,5.754
13,self_attn.k_proj,0.0000002807,0.05000,5.812
13,self_attn.v_proj,0.0000000607,0.05000,5.828
13,self_attn.o_proj,0.0000000006,0.05000,1.556
13,mlp.gate_proj,0.0000008370,0.05000,2.780
13,mlp.up_proj,0.0000007320,0.05000,2.790
13,mlp.down_proj,0.0000000013,0.05000,5.960
14,self_attn.v_proj,0.0000000978,0.05000,5.400
14,self_attn.k_proj,0.0000002809,0.05000,5.464
14,self_attn.q_proj,0.0000006548,0.05000,5.490
14,self_attn.o_proj,0.0000000007,0.05000,1.586
14,mlp.gate_proj,0.0000009377,0.05000,2.823
14,mlp.up_proj,0.0000008157,0.05000,2.830
14,mlp.down_proj,0.0000000017,0.05000,5.987
15,self_attn.q_proj,0.0000008244,0.05000,5.573
15,self_attn.v_proj,0.0000001112,0.05000,5.588
15,self_attn.k_proj,0.0000003675,0.05000,5.609
15,self_attn.o_proj,0.0000000008,0.05000,1.566
15,mlp.gate_proj,0.0000010717,0.05000,2.808
15,mlp.up_proj,0.0000009010,0.05000,2.818
15,mlp.down_proj,0.0000000022,0.05000,5.975
16,self_attn.k_proj,0.0000003414,0.05000,5.454
16,self_attn.q_proj,0.0000007387,0.05000,5.480
16,self_attn.v_proj,0.0000001060,0.05000,5.509
16,self_attn.o_proj,0.0000000009,0.05000,1.547
16,mlp.gate_proj,0.0000013285,0.05000,2.811
16,mlp.up_proj,0.0000010571,0.05000,2.817
16,mlp.down_proj,0.0000000031,0.05000,5.919
17,self_attn.k_proj,0.0000002850,0.05000,5.686
17,self_attn.v_proj,0.0000001007,0.05000,5.715
17,self_attn.q_proj,0.0000006805,0.05000,5.725
17,self_attn.o_proj,0.0000000011,0.05000,1.541
17,mlp.up_proj,0.0000012283,0.05000,2.767
17,mlp.gate_proj,0.0000015413,0.05000,2.776
17,mlp.down_proj,0.0000000043,0.05000,5.974
18,self_attn.v_proj,0.0000001238,0.05000,5.556
18,self_attn.q_proj,0.0000008637,0.05000,5.607
18,self_attn.k_proj,0.0000003386,0.05000,5.626
18,self_attn.o_proj,0.0000000011,0.05000,1.556
18,mlp.gate_proj,0.0000017367,0.05000,2.802
18,mlp.up_proj,0.0000013842,0.05000,2.808
18,mlp.down_proj,0.0000000061,0.05000,5.951
19,self_attn.v_proj,0.0000001450,0.05000,5.642
19,self_attn.k_proj,0.0000003408,0.05000,5.663
19,self_attn.q_proj,0.0000007988,0.05000,5.674
19,self_attn.o_proj,0.0000000013,0.05000,1.604
19,mlp.gate_proj,0.0000019642,0.05000,2.772
19,mlp.up_proj,0.0000015377,0.05000,2.790
19,mlp.down_proj,0.0000000081,0.05000,5.997
20,self_attn.v_proj,0.0000460283,0.05000,5.376
20,self_attn.k_proj,0.0001023333,0.05000,5.450
20,self_attn.q_proj,0.0002501937,0.05000,5.460
20,self_attn.o_proj,0.0000003618,0.05000,1.531
20,mlp.up_proj,0.0004975359,0.05000,2.774
20,mlp.gate_proj,0.0006521194,0.05000,2.779
20,mlp.down_proj,0.0000025065,0.05000,5.931
21,self_attn.q_proj,0.0002477611,0.05000,5.504
21,self_attn.v_proj,0.0000486894,0.05000,5.527
21,self_attn.k_proj,0.0001006711,0.05000,5.532
21,self_attn.o_proj,0.0000003476,0.05000,1.553
21,mlp.gate_proj,0.0007708430,0.05000,2.834
21,mlp.up_proj,0.0005485023,0.05000,2.842
21,mlp.down_proj,0.0000025757,0.05000,5.948
22,self_attn.k_proj,0.0000960108,0.05000,5.470
22,self_attn.v_proj,0.0000507348,0.05000,5.527
22,self_attn.q_proj,0.0002405264,0.05000,5.538
22,self_attn.o_proj,0.0000002108,0.05000,1.560
22,mlp.gate_proj,0.0008269122,0.05000,2.758
22,mlp.up_proj,0.0005943207,0.05000,2.774
22,mlp.down_proj,0.0000027136,0.05000,5.973
23,self_attn.k_proj,0.0000954055,0.05000,5.533
23,self_attn.q_proj,0.0002420283,0.05000,5.626
23,self_attn.v_proj,0.0000532537,0.05000,5.632
23,self_attn.o_proj,0.0000003501,0.05000,1.542
23,mlp.gate_proj,0.0009137075,0.05000,2.776
23,mlp.up_proj,0.0006547531,0.05000,2.791
23,mlp.down_proj,0.0000030363,0.05000,5.945
24,self_attn.v_proj,0.0000622052,0.05000,5.253
24,self_attn.k_proj,0.0001111750,0.05000,5.364
24,self_attn.q_proj,0.0002778825,0.05000,5.381
24,self_attn.o_proj,0.0000003277,0.05000,1.549
24,mlp.gate_proj,0.0010315949,0.05000,2.772
24,mlp.up_proj,0.0007254657,0.05000,2.776
24,mlp.down_proj,0.0000033368,0.05000,5.985
25,self_attn.q_proj,0.0002790395,0.05000,5.293
25,self_attn.k_proj,0.0001072556,0.05000,5.306
25,self_attn.v_proj,0.0000711914,0.05000,5.348
25,self_attn.o_proj,0.0000003792,0.05000,1.548
25,mlp.gate_proj,0.0011210348,0.05000,2.794
25,mlp.up_proj,0.0007955477,0.05000,2.800
25,mlp.down_proj,0.0000038278,0.05000,5.962
26,self_attn.k_proj,0.0001005206,0.05000,5.340
26,self_attn.v_proj,0.0000751634,0.05000,5.363
26,self_attn.q_proj,0.0002639526,0.05000,5.399
26,self_attn.o_proj,0.0000004955,0.05000,1.543
26,mlp.gate_proj,0.0011751253,0.05000,2.736
26,mlp.up_proj,0.0008637970,0.05000,2.749
26,mlp.down_proj,0.0000043847,0.05000,5.972
27,self_attn.v_proj,0.0000680719,0.05000,5.472
27,self_attn.k_proj,0.0001012717,0.05000,5.603
27,self_attn.q_proj,0.0002717224,0.05000,5.640
27,self_attn.o_proj,0.0000005582,0.05000,1.565
27,mlp.up_proj,0.0009500155,0.05000,2.771
27,mlp.gate_proj,0.0012836707,0.05000,2.789
27,mlp.down_proj,0.0000051473,0.05000,5.936
28,self_attn.v_proj,0.0000992078,0.05000,5.279
28,self_attn.q_proj,0.0002645630,0.05000,5.304
28,self_attn.k_proj,0.0001015999,0.05000,5.323
28,self_attn.o_proj,0.0000008682,0.05000,1.565
28,mlp.up_proj,0.0010524418,0.05000,2.756
28,mlp.gate_proj,0.0013713280,0.05000,2.756
28,mlp.down_proj,0.0000069629,0.05000,5.935
29,self_attn.q_proj,0.0003024004,0.05000,5.304
29,self_attn.v_proj,0.0001436985,0.05000,5.320
29,self_attn.k_proj,0.0001024819,0.05000,5.347
29,self_attn.o_proj,0.0000018162,0.05000,1.534
29,mlp.gate_proj,0.0013321182,0.05000,2.757
29,mlp.up_proj,0.0010659065,0.05000,2.770
29,mlp.down_proj,0.0000087815,0.05000,5.935
30,self_attn.k_proj,0.0000003260,0.05000,5.367
30,self_attn.q_proj,0.0000009703,0.05000,5.382
30,self_attn.v_proj,0.0000005463,0.05000,5.396
30,self_attn.o_proj,0.0000000055,0.05000,1.542
30,mlp.up_proj,0.0000037689,0.05000,2.758
30,mlp.gate_proj,0.0000046290,0.05000,2.762
30,mlp.down_proj,0.0000000387,0.05000,5.944
31,self_attn.v_proj,0.0000005541,0.05000,5.782
31,self_attn.q_proj,0.0000009006,0.05000,5.797
31,self_attn.k_proj,0.0000003091,0.05000,5.814
31,self_attn.o_proj,0.0000000074,0.05000,1.541
31,mlp.gate_proj,0.0000037887,0.05000,2.776
31,mlp.up_proj,0.0000029935,0.05000,2.782
31,mlp.down_proj,0.0000000543,0.05000,5.973