Mistral-7b-V3-IT-code-0.3 / quant_log.csv
Devbora29's picture
Upload folder using huggingface_hub
35a3179 verified
Raw
History Blame Contribute Delete
10.4 kB
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000000045,0.05000,4.840
0,self_attn.v_proj,0.0000000004,0.05000,5.288
0,self_attn.q_proj,0.0000000150,0.05000,5.068
0,self_attn.o_proj,0.0000000000,0.05000,1.513
0,mlp.up_proj,0.0000000142,0.05000,2.825
0,mlp.gate_proj,0.0000000164,0.05000,2.834
0,mlp.down_proj,0.0000000000,0.05000,5.910
1,self_attn.q_proj,0.0000000452,0.05000,4.740
1,self_attn.k_proj,0.0000000208,0.05000,4.753
1,self_attn.v_proj,0.0000000034,0.05000,4.794
1,self_attn.o_proj,0.0000000000,0.05000,1.628
1,mlp.up_proj,0.0000000480,0.05000,2.837
1,mlp.gate_proj,0.0000000548,0.05000,2.865
1,mlp.down_proj,0.0000000073,0.05000,5.963
2,self_attn.k_proj,0.0000001725,0.05000,4.514
2,self_attn.q_proj,0.0000003553,0.05000,4.526
2,self_attn.v_proj,0.0000000225,0.05000,4.536
2,self_attn.o_proj,0.0000000000,0.05000,2.101
2,mlp.up_proj,0.0000001006,0.05000,2.791
2,mlp.gate_proj,0.0000001153,0.05000,2.805
2,mlp.down_proj,0.0000000000,0.05000,5.912
3,self_attn.v_proj,0.0000000155,0.05000,4.692
3,self_attn.q_proj,0.0000001928,0.05000,4.718
3,self_attn.k_proj,0.0000000937,0.05000,4.730
3,self_attn.o_proj,0.0000000000,0.05000,1.556
3,mlp.gate_proj,0.0000001922,0.05000,2.877
3,mlp.up_proj,0.0000001660,0.05000,2.891
3,mlp.down_proj,0.0000000001,0.05000,5.870
4,self_attn.k_proj,0.0000001324,0.05000,4.821
4,self_attn.q_proj,0.0000003002,0.05000,4.843
4,self_attn.v_proj,0.0000000261,0.05000,4.850
4,self_attn.o_proj,0.0000000000,0.05000,1.527
4,mlp.gate_proj,0.0000002774,0.05000,2.827
4,mlp.up_proj,0.0000002246,0.05000,2.837
4,mlp.down_proj,0.0000000001,0.05000,5.955
5,self_attn.k_proj,0.0000001730,0.05000,4.897
5,self_attn.v_proj,0.0000000291,0.05000,4.904
5,self_attn.q_proj,0.0000003899,0.05000,4.909
5,self_attn.o_proj,0.0000000001,0.05000,1.577
5,mlp.up_proj,0.0000002912,0.05000,2.816
5,mlp.gate_proj,0.0000003836,0.05000,2.831
5,mlp.down_proj,0.0000000003,0.05000,5.922
6,self_attn.q_proj,0.0000003636,0.05000,4.775
6,self_attn.k_proj,0.0000001706,0.05000,4.862
6,self_attn.v_proj,0.0000000294,0.05000,4.873
6,self_attn.o_proj,0.0000000001,0.05000,1.533
6,mlp.up_proj,0.0000003460,0.05000,2.797
6,mlp.gate_proj,0.0000004451,0.05000,2.797
6,mlp.down_proj,0.0000000004,0.05000,5.935
7,self_attn.v_proj,0.0000000391,0.05000,4.774
7,self_attn.q_proj,0.0000004503,0.05000,4.793
7,self_attn.k_proj,0.0000002152,0.05000,4.811
7,self_attn.o_proj,0.0000000001,0.05000,1.568
7,mlp.up_proj,0.0000004005,0.05000,2.814
7,mlp.gate_proj,0.0000005274,0.05000,2.818
7,mlp.down_proj,0.0000000005,0.05000,5.941
8,self_attn.k_proj,0.0000001697,0.05000,4.593
8,self_attn.q_proj,0.0000003730,0.05000,4.593
8,self_attn.v_proj,0.0000000364,0.05000,4.615
8,self_attn.o_proj,0.0000000002,0.05000,1.552
8,mlp.gate_proj,0.0000005689,0.05000,2.832
8,mlp.up_proj,0.0000004404,0.05000,2.842
8,mlp.down_proj,0.0000000005,0.05000,5.915
9,self_attn.q_proj,0.0000005147,0.05000,4.651
9,self_attn.v_proj,0.0000000435,0.05000,4.676
9,self_attn.k_proj,0.0000002410,0.05000,4.684
9,self_attn.o_proj,0.0000000002,0.05000,1.546
9,mlp.gate_proj,0.0000005988,0.05000,2.826
9,mlp.up_proj,0.0000004793,0.05000,2.834
9,mlp.down_proj,0.0000000007,0.05000,5.961
10,self_attn.k_proj,0.0000002164,0.05000,4.770
10,self_attn.q_proj,0.0000004548,0.05000,4.779
10,self_attn.v_proj,0.0000000379,0.05000,4.786
10,self_attn.o_proj,0.0000000003,0.05000,1.531
10,mlp.gate_proj,0.0000006227,0.05000,2.837
10,mlp.up_proj,0.0000005106,0.05000,2.848
10,mlp.down_proj,0.0000000008,0.05000,5.918
11,self_attn.k_proj,0.0000002533,0.05000,4.929
11,self_attn.q_proj,0.0000005502,0.05000,5.001
11,self_attn.v_proj,0.0000000559,0.05000,5.031
11,self_attn.o_proj,0.0000000004,0.05000,1.540
11,mlp.gate_proj,0.0000006790,0.05000,2.822
11,mlp.up_proj,0.0000005648,0.05000,2.831
11,mlp.down_proj,0.0000000009,0.05000,5.917
12,self_attn.q_proj,0.0000007278,0.05000,4.785
12,self_attn.v_proj,0.0000000635,0.05000,4.804
12,self_attn.k_proj,0.0000003287,0.05000,4.831
12,self_attn.o_proj,0.0000000004,0.05000,1.534
12,mlp.gate_proj,0.0000007479,0.05000,2.831
12,mlp.up_proj,0.0000006364,0.05000,2.836
12,mlp.down_proj,0.0000000011,0.05000,5.979
13,self_attn.k_proj,0.0000002807,0.05000,4.666
13,self_attn.q_proj,0.0000005740,0.05000,4.694
13,self_attn.v_proj,0.0000000607,0.05000,4.704
13,self_attn.o_proj,0.0000000006,0.05000,1.560
13,mlp.gate_proj,0.0000008370,0.05000,2.828
13,mlp.up_proj,0.0000007320,0.05000,2.845
13,mlp.down_proj,0.0000000013,0.05000,5.919
14,self_attn.q_proj,0.0000006548,0.05000,4.817
14,self_attn.v_proj,0.0000000978,0.05000,4.860
14,self_attn.k_proj,0.0000002809,0.05000,4.864
14,self_attn.o_proj,0.0000000007,0.05000,1.548
14,mlp.gate_proj,0.0000009377,0.05000,2.863
14,mlp.up_proj,0.0000008157,0.05000,2.875
14,mlp.down_proj,0.0000000017,0.05000,5.917
15,self_attn.k_proj,0.0000003675,0.05000,4.802
15,self_attn.v_proj,0.0000001112,0.05000,4.832
15,self_attn.q_proj,0.0000008244,0.05000,4.842
15,self_attn.o_proj,0.0000000008,0.05000,1.565
15,mlp.gate_proj,0.0000010717,0.05000,2.820
15,mlp.up_proj,0.0000009010,0.05000,2.821
15,mlp.down_proj,0.0000000022,0.05000,5.900
16,self_attn.k_proj,0.0000003414,0.05000,4.800
16,self_attn.q_proj,0.0000007387,0.05000,4.826
16,self_attn.v_proj,0.0000001060,0.05000,4.831
16,self_attn.o_proj,0.0000000009,0.05000,1.555
16,mlp.up_proj,0.0000010571,0.05000,2.796
16,mlp.gate_proj,0.0000013285,0.05000,2.804
16,mlp.down_proj,0.0000000031,0.05000,5.935
17,self_attn.v_proj,0.0000001007,0.05000,4.906
17,self_attn.k_proj,0.0000002850,0.05000,4.927
17,self_attn.q_proj,0.0000006805,0.05000,4.970
17,self_attn.o_proj,0.0000000011,0.05000,1.555
17,mlp.up_proj,0.0000012283,0.05000,2.795
17,mlp.gate_proj,0.0000015413,0.05000,2.803
17,mlp.down_proj,0.0000000043,0.05000,5.859
18,self_attn.v_proj,0.0000001238,0.05000,4.658
18,self_attn.k_proj,0.0000003386,0.05000,4.669
18,self_attn.q_proj,0.0000008637,0.05000,4.682
18,self_attn.o_proj,0.0000000011,0.05000,1.535
18,mlp.up_proj,0.0000013842,0.05000,2.782
18,mlp.gate_proj,0.0000017367,0.05000,2.792
18,mlp.down_proj,0.0000000061,0.05000,5.917
19,self_attn.k_proj,0.0000003408,0.05000,4.715
19,self_attn.q_proj,0.0000007988,0.05000,4.776
19,self_attn.v_proj,0.0000001450,0.05000,4.783
19,self_attn.o_proj,0.0000000013,0.05000,1.550
19,mlp.up_proj,0.0000015377,0.05000,2.835
19,mlp.gate_proj,0.0000019642,0.05000,2.851
19,mlp.down_proj,0.0000000081,0.05000,5.902
20,self_attn.v_proj,0.0000460283,0.05000,4.815
20,self_attn.q_proj,0.0002501937,0.05000,4.853
20,self_attn.k_proj,0.0001023333,0.05000,4.865
20,self_attn.o_proj,0.0000003618,0.05000,1.536
20,mlp.up_proj,0.0004975359,0.05000,2.848
20,mlp.gate_proj,0.0006521194,0.05000,2.854
20,mlp.down_proj,0.0000025065,0.05000,5.928
21,self_attn.k_proj,0.0001006711,0.05000,4.614
21,self_attn.v_proj,0.0000486894,0.05000,4.634
21,self_attn.q_proj,0.0002477611,0.05000,4.647
21,self_attn.o_proj,0.0000003476,0.05000,1.568
21,mlp.gate_proj,0.0007708430,0.05000,2.823
21,mlp.up_proj,0.0005485023,0.05000,2.831
21,mlp.down_proj,0.0000025757,0.05000,5.958
22,self_attn.v_proj,0.0000507348,0.05000,4.733
22,self_attn.q_proj,0.0002405264,0.05000,4.754
22,self_attn.k_proj,0.0000960108,0.05000,4.761
22,self_attn.o_proj,0.0000002108,0.05000,1.536
22,mlp.up_proj,0.0005943207,0.05000,2.806
22,mlp.gate_proj,0.0008269122,0.05000,2.810
22,mlp.down_proj,0.0000027136,0.05000,5.895
23,self_attn.k_proj,0.0000954055,0.05000,4.678
23,self_attn.q_proj,0.0002420283,0.05000,4.711
23,self_attn.v_proj,0.0000532537,0.05000,4.729
23,self_attn.o_proj,0.0000003501,0.05000,1.521
23,mlp.up_proj,0.0006547531,0.05000,2.851
23,mlp.gate_proj,0.0009137075,0.05000,2.879
23,mlp.down_proj,0.0000030363,0.05000,5.912
24,self_attn.v_proj,0.0000622052,0.05000,4.498
24,self_attn.k_proj,0.0001111750,0.05000,4.528
24,self_attn.q_proj,0.0002778825,0.05000,4.554
24,self_attn.o_proj,0.0000003277,0.05000,1.578
24,mlp.up_proj,0.0007254657,0.05000,2.841
24,mlp.gate_proj,0.0010315949,0.05000,2.861
24,mlp.down_proj,0.0000033368,0.05000,5.904
25,self_attn.v_proj,0.0000711914,0.05000,4.562
25,self_attn.k_proj,0.0001072556,0.05000,4.586
25,self_attn.q_proj,0.0002790395,0.05000,4.612
25,self_attn.o_proj,0.0000003792,0.05000,1.566
25,mlp.gate_proj,0.0011210348,0.05000,2.902
25,mlp.up_proj,0.0007955477,0.05000,2.907
25,mlp.down_proj,0.0000038278,0.05000,5.972
26,self_attn.v_proj,0.0000751634,0.05000,4.598
26,self_attn.k_proj,0.0001005206,0.05000,4.633
26,self_attn.q_proj,0.0002639526,0.05000,4.640
26,self_attn.o_proj,0.0000004955,0.05000,1.556
26,mlp.up_proj,0.0008637970,0.05000,2.815
26,mlp.gate_proj,0.0011751253,0.05000,2.820
26,mlp.down_proj,0.0000043847,0.05000,5.919
27,self_attn.v_proj,0.0000680719,0.05000,4.600
27,self_attn.k_proj,0.0001012717,0.05000,4.649
27,self_attn.q_proj,0.0002717224,0.05000,4.657
27,self_attn.o_proj,0.0000005582,0.05000,1.540
27,mlp.gate_proj,0.0012836707,0.05000,2.818
27,mlp.up_proj,0.0009500155,0.05000,2.832
27,mlp.down_proj,0.0000051473,0.05000,5.936
28,self_attn.q_proj,0.0002645630,0.05000,4.639
28,self_attn.k_proj,0.0001015999,0.05000,4.661
28,self_attn.v_proj,0.0000992078,0.05000,4.686
28,self_attn.o_proj,0.0000008682,0.05000,1.564
28,mlp.gate_proj,0.0013713280,0.05000,2.813
28,mlp.up_proj,0.0010524418,0.05000,2.818
28,mlp.down_proj,0.0000069629,0.05000,5.921
29,self_attn.v_proj,0.0001436985,0.05000,4.504
29,self_attn.k_proj,0.0001024819,0.05000,4.512
29,self_attn.q_proj,0.0003024004,0.05000,4.519
29,self_attn.o_proj,0.0000018162,0.05000,1.541
29,mlp.gate_proj,0.0013321182,0.05000,2.801
29,mlp.up_proj,0.0010659065,0.05000,2.823
29,mlp.down_proj,0.0000087815,0.05000,5.863
30,self_attn.v_proj,0.0000005463,0.05000,4.492
30,self_attn.k_proj,0.0000003260,0.05000,4.527
30,self_attn.q_proj,0.0000009703,0.05000,4.532
30,self_attn.o_proj,0.0000000055,0.05000,1.522
30,mlp.gate_proj,0.0000046290,0.05000,2.849
30,mlp.up_proj,0.0000037689,0.05000,2.855
30,mlp.down_proj,0.0000000387,0.05000,5.934
31,self_attn.k_proj,0.0000003091,0.05000,4.778
31,self_attn.q_proj,0.0000009006,0.05000,4.797
31,self_attn.v_proj,0.0000005541,0.05000,4.808
31,self_attn.o_proj,0.0000000074,0.05000,1.543
31,mlp.up_proj,0.0000029935,0.05000,2.817
31,mlp.gate_proj,0.0000037887,0.05000,2.823
31,mlp.down_proj,0.0000000543,0.05000,5.876