viveksil's picture
Add files using upload-large-folder tool
00b2f1e verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.00022096,0.01000,1.099
0,self_attn.v_proj,0.00000229,0.01000,2.435
0,self_attn.q_proj,0.00036210,0.01000,2.448
0,self_attn.o_proj,0.00000175,0.01000,2.415
0,mlp.up_proj,0.00150737,0.01000,1.416
0,mlp.gate_proj,0.00142441,0.01000,0.274
0,mlp.down_proj,0.00595958,0.01000,0.739
1,self_attn.k_proj,0.00078274,0.01000,0.286
1,self_attn.v_proj,0.00015115,0.01000,0.272
1,self_attn.q_proj,0.00174118,0.01000,0.162
1,self_attn.o_proj,0.00103411,0.01000,0.769
1,mlp.up_proj,0.00179594,0.01000,1.660
1,mlp.gate_proj,0.00228291,0.01000,0.973
1,mlp.down_proj,0.00224895,0.01000,0.746
2,self_attn.k_proj,0.00125878,0.01000,0.437
2,self_attn.v_proj,0.00020735,0.01000,0.269
2,self_attn.q_proj,0.00295782,0.01000,0.638
2,self_attn.o_proj,0.00098028,0.01000,0.810
2,mlp.up_proj,0.00240148,0.01000,0.318
2,mlp.gate_proj,0.00286920,0.01000,0.260
2,mlp.down_proj,0.00500130,0.01000,6.505
3,self_attn.k_proj,0.00188067,0.01000,1.197
3,self_attn.v_proj,0.00074529,0.01000,0.289
3,self_attn.q_proj,0.00454102,0.01000,0.292
3,self_attn.o_proj,0.00114469,0.01000,0.283
3,mlp.up_proj,0.00272536,0.01000,0.309
3,mlp.gate_proj,0.00309045,0.01000,0.279
3,mlp.down_proj,0.00337280,0.01000,0.736
4,self_attn.k_proj,0.00178011,0.01000,0.471
4,self_attn.v_proj,0.00069859,0.01000,0.149
4,self_attn.q_proj,0.00427734,0.01000,0.145
4,self_attn.o_proj,0.00194755,0.01000,1.499
4,mlp.up_proj,0.00357304,0.01000,0.308
4,mlp.gate_proj,0.00408032,0.01000,0.289
4,mlp.down_proj,0.00474062,0.01000,0.744
5,self_attn.k_proj,0.00194141,0.01000,0.269
5,self_attn.v_proj,0.00072606,0.01000,0.919
5,self_attn.q_proj,0.00453751,0.01000,1.476
5,self_attn.o_proj,0.00234540,0.01000,0.281
5,mlp.up_proj,0.00409303,0.01000,0.266
5,mlp.gate_proj,0.00449629,0.01000,0.596
5,mlp.down_proj,0.00556781,0.01000,6.516
6,self_attn.k_proj,0.00163071,0.01000,0.275
6,self_attn.v_proj,0.00068974,0.01000,0.287
6,self_attn.q_proj,0.00406556,0.01000,0.276
6,self_attn.o_proj,0.00182722,0.01000,0.284
6,mlp.up_proj,0.00438432,0.01000,0.273
6,mlp.gate_proj,0.00448065,0.01000,0.271
6,mlp.down_proj,0.00687783,0.01000,0.819
7,self_attn.k_proj,0.00229149,0.01000,0.366
7,self_attn.v_proj,0.00139370,0.01000,0.148
7,self_attn.q_proj,0.00637256,0.01000,0.142
7,self_attn.o_proj,0.00216803,0.01000,1.421
7,mlp.up_proj,0.00479016,0.01000,0.280
7,mlp.gate_proj,0.00473948,0.01000,0.287
7,mlp.down_proj,0.00823352,0.01000,0.831
8,self_attn.k_proj,0.00214538,0.01000,1.666
8,self_attn.v_proj,0.00103131,0.01000,1.952
8,self_attn.q_proj,0.00540090,0.01000,1.636
8,self_attn.o_proj,0.00283757,0.01000,0.303
8,mlp.up_proj,0.00546549,0.01000,0.274
8,mlp.gate_proj,0.00495393,0.01000,0.275
8,mlp.down_proj,0.01154038,0.01000,6.464
9,self_attn.k_proj,0.00147208,0.01000,1.818
9,self_attn.v_proj,0.00058141,0.01000,1.731
9,self_attn.q_proj,0.00394661,0.01000,1.675
9,self_attn.o_proj,0.00251221,0.01000,0.324
9,mlp.up_proj,0.00595842,0.01000,0.347
9,mlp.gate_proj,0.00489875,0.01000,0.343
9,mlp.down_proj,0.01428184,0.01000,0.904
10,self_attn.k_proj,0.00132155,0.01000,2.685
10,self_attn.v_proj,0.00068617,0.01000,2.503
10,self_attn.q_proj,0.00363028,0.01000,1.752
10,self_attn.o_proj,0.00545926,0.01000,0.408
10,mlp.up_proj,0.00611763,0.01000,1.632
10,mlp.gate_proj,0.00474317,0.01000,1.328
10,mlp.down_proj,0.01347071,0.01000,2.937
11,self_attn.k_proj,0.00115821,0.01000,3.339
11,self_attn.v_proj,0.00065106,0.01000,2.422
11,self_attn.q_proj,0.00344706,0.01000,2.382
11,self_attn.o_proj,0.00740811,0.01000,2.400
11,mlp.up_proj,0.00620620,0.01000,2.718
11,mlp.gate_proj,0.00449832,0.01000,2.710
11,mlp.down_proj,0.27257532,0.01000,5.754
12,self_attn.k_proj,0.00163961,0.01000,0.344
12,self_attn.v_proj,0.00094356,0.01000,0.337
12,self_attn.q_proj,0.00456318,0.01000,0.338
12,self_attn.o_proj,0.00419531,0.01000,1.311
12,mlp.up_proj,0.00565002,0.01000,0.279
12,mlp.gate_proj,0.00445975,0.01000,1.091
12,mlp.down_proj,0.01192240,0.01000,4.327
13,self_attn.k_proj,0.00174242,0.01000,0.339
13,self_attn.v_proj,0.00083272,0.01000,0.344
13,self_attn.q_proj,0.00502530,0.01000,0.395
13,self_attn.o_proj,0.00500150,0.01000,0.343
13,mlp.up_proj,0.00570113,0.01000,1.926
13,mlp.gate_proj,0.00524486,0.01000,1.750
13,mlp.down_proj,0.01178209,0.01000,2.821
14,self_attn.k_proj,0.00200629,0.01000,0.361
14,self_attn.v_proj,0.00157519,0.01000,0.359
14,self_attn.q_proj,0.00566488,0.01000,0.366
14,self_attn.o_proj,0.00620107,0.01000,2.248
14,mlp.up_proj,0.00577955,0.01000,4.655
14,mlp.gate_proj,0.00547774,0.01000,5.042
14,mlp.down_proj,0.01469438,0.01000,8.832
15,self_attn.k_proj,0.00194205,0.01000,0.349
15,self_attn.v_proj,0.00151308,0.01000,0.345
15,self_attn.q_proj,0.00563300,0.01000,0.342
15,self_attn.o_proj,0.00601548,0.01000,0.344
15,mlp.up_proj,0.00601284,0.01000,0.342
15,mlp.gate_proj,0.00594717,0.01000,0.336
15,mlp.down_proj,0.01753610,0.01000,5.689
16,self_attn.k_proj,0.00155090,0.01000,1.763
16,self_attn.v_proj,0.00110804,0.01000,0.365
16,self_attn.q_proj,0.00422240,0.01000,0.357
16,self_attn.o_proj,0.00903260,0.01000,0.345
16,mlp.up_proj,0.00553630,0.01000,1.181
16,mlp.gate_proj,0.00532908,0.01000,1.499
16,mlp.down_proj,0.01532181,0.01000,5.315
17,self_attn.k_proj,0.00241632,0.01000,0.830
17,self_attn.v_proj,0.00194845,0.01000,2.641
17,self_attn.q_proj,0.00834111,0.01000,4.413
17,self_attn.o_proj,0.01061929,0.01000,2.746
17,mlp.up_proj,0.00562216,0.01000,2.742
17,mlp.gate_proj,0.00506327,0.01000,1.101
17,mlp.down_proj,0.01818097,0.01000,4.789
18,self_attn.k_proj,0.00273163,0.01000,2.613
18,self_attn.v_proj,0.00311299,0.01000,1.891
18,self_attn.q_proj,0.00828936,0.01000,0.344
18,self_attn.o_proj,0.00938506,0.01000,0.345
18,mlp.up_proj,0.00625932,0.01000,0.344
18,mlp.gate_proj,0.00583430,0.01000,0.339
18,mlp.down_proj,0.03318551,0.01000,2.234
19,self_attn.k_proj,0.00133622,0.01000,0.326
19,self_attn.v_proj,0.00225405,0.01000,0.800
19,self_attn.q_proj,0.00550781,0.01000,1.800
19,self_attn.o_proj,0.01567704,0.01000,0.449
19,mlp.up_proj,0.00725614,0.01000,2.903
19,mlp.gate_proj,0.00687203,0.01000,2.471
19,mlp.down_proj,0.03395692,0.01000,2.946
20,self_attn.k_proj,0.00182818,0.01000,0.388
20,self_attn.v_proj,0.00369986,0.01000,1.045
20,self_attn.q_proj,0.00668970,0.01000,3.772
20,self_attn.o_proj,0.01447436,0.01000,3.580
20,mlp.up_proj,0.00868652,0.01000,2.710
20,mlp.gate_proj,0.00763109,0.01000,1.037
20,mlp.down_proj,0.06614500,0.01000,3.153
21,self_attn.k_proj,0.00169165,0.01000,0.353
21,self_attn.v_proj,0.00278996,0.01000,1.556
21,self_attn.q_proj,0.00603606,0.01000,2.608
21,self_attn.o_proj,0.01160419,0.01000,2.633
21,mlp.up_proj,0.00941546,0.01000,2.761
21,mlp.gate_proj,0.00857336,0.01000,1.637
21,mlp.down_proj,0.05236044,0.01000,3.023
22,self_attn.k_proj,0.00173458,0.01000,0.340
22,self_attn.v_proj,0.00304587,0.01000,0.335
22,self_attn.q_proj,0.00609978,0.01000,1.500
22,self_attn.o_proj,0.01699413,0.01000,0.329
22,mlp.up_proj,0.01043702,0.01000,3.157
22,mlp.gate_proj,0.00901166,0.01000,2.403
22,mlp.down_proj,0.08635419,0.01000,2.277
23,self_attn.k_proj,0.00235798,0.01000,2.724
23,self_attn.v_proj,0.00853371,0.01000,2.700
23,self_attn.q_proj,0.00731025,0.01000,2.679
23,self_attn.o_proj,0.04595792,0.01000,0.347
23,mlp.up_proj,0.01267573,0.01000,1.922
23,mlp.gate_proj,0.00977481,0.01000,1.572
23,mlp.down_proj,0.09878369,0.01000,1.992
24,self_attn.k_proj,0.00193833,0.01000,0.352
24,self_attn.v_proj,0.00926276,0.01000,0.343
24,self_attn.q_proj,0.00732911,0.01000,0.354
24,self_attn.o_proj,0.02490180,0.01000,0.294
24,mlp.up_proj,0.01275103,0.01000,3.643
24,mlp.gate_proj,0.00968059,0.01000,4.339
24,mlp.down_proj,0.13135986,0.01000,6.748
25,self_attn.k_proj,0.00188807,0.01000,1.592
25,self_attn.v_proj,0.00410724,0.01000,1.087
25,self_attn.q_proj,0.00648702,0.01000,0.338
25,self_attn.o_proj,0.01829978,0.01000,1.828
25,mlp.up_proj,0.01323432,0.01000,0.353
25,mlp.gate_proj,0.01043347,0.01000,0.343
25,mlp.down_proj,0.10982227,0.01000,6.597
26,self_attn.k_proj,0.00186195,0.01000,3.885
26,self_attn.v_proj,0.00593649,0.01000,2.686
26,self_attn.q_proj,0.00663982,0.01000,0.818
26,self_attn.o_proj,0.02385299,0.01000,0.346
26,mlp.up_proj,0.01519259,0.01000,0.357
26,mlp.gate_proj,0.01179895,0.01000,0.383
26,mlp.down_proj,0.16240232,0.01000,2.805
27,self_attn.k_proj,0.00188216,0.01000,0.753
27,self_attn.v_proj,0.00480582,0.01000,2.568
27,self_attn.q_proj,0.00687713,0.01000,3.243
27,self_attn.o_proj,0.03130198,0.01000,1.944
27,mlp.up_proj,0.01527163,0.01000,0.361
27,mlp.gate_proj,0.01144433,0.01000,0.350
27,mlp.down_proj,0.20937583,0.01000,6.981
28,self_attn.k_proj,0.00163398,0.01000,2.274
28,self_attn.v_proj,0.00619308,0.01000,0.347
28,self_attn.q_proj,0.00561940,0.01000,1.200
28,self_attn.o_proj,0.02704479,0.01000,0.391
28,mlp.up_proj,0.01647252,0.01000,0.362
28,mlp.gate_proj,0.01167521,0.01000,0.348
28,mlp.down_proj,3.19434714,0.01000,7.166
29,self_attn.k_proj,0.00153822,0.01000,1.574
29,self_attn.v_proj,0.00717453,0.01000,0.978
29,self_attn.q_proj,0.00649254,0.01000,1.795
29,self_attn.o_proj,0.06275121,0.01000,0.949
29,mlp.up_proj,0.02440672,0.01000,2.122
29,mlp.gate_proj,0.01807862,0.01000,0.632
29,mlp.down_proj,0.86159390,0.01000,0.909