Abdohaaland's picture
Upload folder using huggingface_hub
f09e7d3 verified
layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000036928,0.05000,1.790
0,self_attn.o_proj,0.0000001945,0.05000,1.331
0,mlp.up_proj,0.0000102390,0.05000,2.562
0,mlp.gate_proj,0.0000106993,0.05000,2.597
0,mlp.down_proj,0.0000007873,0.05000,3.140
1,self_attn.qkv_proj,0.0000288658,0.05000,1.350
1,self_attn.o_proj,0.0000003944,0.05000,1.314
1,mlp.up_proj,0.0000151884,0.05000,3.192
1,mlp.gate_proj,0.0000162423,0.05000,3.248
1,mlp.down_proj,0.0000017862,0.05000,3.335
2,self_attn.qkv_proj,0.0000672307,0.05000,1.265
2,self_attn.o_proj,0.0000004262,0.05000,1.162
2,mlp.up_proj,0.0000219007,0.05000,2.728
2,mlp.gate_proj,0.0000236388,0.05000,2.739
2,mlp.down_proj,0.0000015235,0.05000,3.191
3,self_attn.qkv_proj,0.0000958284,0.05000,1.113
3,self_attn.o_proj,0.0000007994,0.05000,1.071
3,mlp.gate_proj,0.0000320000,0.05000,2.401
3,mlp.up_proj,0.0000289537,0.05000,2.435
3,mlp.down_proj,0.0003337474,0.05000,3.272
4,self_attn.qkv_proj,0.0000909789,0.05000,1.106
4,self_attn.o_proj,0.0000012312,0.05000,1.100
4,mlp.up_proj,0.0000345329,0.05000,2.538
4,mlp.gate_proj,0.0000400292,0.05000,2.554
4,mlp.down_proj,0.0000039765,0.05000,3.210
5,self_attn.qkv_proj,0.0001159516,0.05000,1.133
5,self_attn.o_proj,0.0000017395,0.05000,1.128
5,mlp.up_proj,0.0000430088,0.05000,2.448
5,mlp.gate_proj,0.0000509520,0.05000,2.467
5,mlp.down_proj,0.0000057463,0.05000,3.189
6,self_attn.qkv_proj,0.0000961327,0.05000,1.115
6,self_attn.o_proj,0.0000022428,0.05000,1.125
6,mlp.up_proj,0.0000430322,0.05000,2.552
6,mlp.gate_proj,0.0000487083,0.05000,2.587
6,mlp.down_proj,0.0000063000,0.05000,3.109
7,self_attn.qkv_proj,0.0001434261,0.05000,1.093
7,self_attn.o_proj,0.0000029053,0.05000,1.076
7,mlp.up_proj,0.0000461718,0.05000,2.553
7,mlp.gate_proj,0.0000501546,0.05000,2.579
7,mlp.down_proj,0.0000080737,0.05000,3.201
8,self_attn.qkv_proj,0.0001350463,0.05000,1.091
8,self_attn.o_proj,0.0000040604,0.05000,1.109
8,mlp.up_proj,0.0000482156,0.05000,2.403
8,mlp.gate_proj,0.0000492231,0.05000,2.431
8,mlp.down_proj,0.0000089525,0.05000,3.215
9,self_attn.qkv_proj,0.0001197565,0.05000,1.137
9,self_attn.o_proj,0.0000039595,0.05000,1.111
9,mlp.up_proj,0.0000522804,0.05000,2.498
9,mlp.gate_proj,0.0000520745,0.05000,2.531
9,mlp.down_proj,0.0000084691,0.05000,3.158
10,self_attn.qkv_proj,0.0001285350,0.05000,1.141
10,self_attn.o_proj,0.0000056212,0.05000,1.134
10,mlp.up_proj,0.0000538686,0.05000,2.537
10,mlp.gate_proj,0.0000539127,0.05000,2.535
10,mlp.down_proj,0.0000092388,0.05000,3.212
11,self_attn.qkv_proj,0.0001265468,0.05000,1.102
11,self_attn.o_proj,0.0000049263,0.05000,1.106
11,mlp.up_proj,0.0000561754,0.05000,2.543
11,mlp.gate_proj,0.0000538750,0.05000,2.569
11,mlp.down_proj,0.0000098257,0.05000,3.231
12,self_attn.qkv_proj,0.0001307771,0.05000,1.150
12,self_attn.o_proj,0.0000049451,0.05000,1.125
12,mlp.gate_proj,0.0000524987,0.05000,2.460
12,mlp.up_proj,0.0000571596,0.05000,2.484
12,mlp.down_proj,0.0000116566,0.05000,3.190
13,self_attn.qkv_proj,0.0001563531,0.05000,1.108
13,self_attn.o_proj,0.0000065090,0.05000,1.103
13,mlp.up_proj,0.0000612276,0.05000,2.490
13,mlp.gate_proj,0.0000543759,0.05000,2.508
13,mlp.down_proj,0.0000127317,0.05000,3.187
14,self_attn.qkv_proj,0.0001393042,0.05000,1.131
14,self_attn.o_proj,0.0000061571,0.05000,1.116
14,mlp.gate_proj,0.0000600704,0.05000,2.562
14,mlp.up_proj,0.0000672100,0.05000,2.584
14,mlp.down_proj,0.0000145146,0.05000,3.154
15,self_attn.qkv_proj,0.0001545983,0.05000,1.100
15,self_attn.o_proj,0.0000057894,0.05000,1.103
15,mlp.gate_proj,0.0000662487,0.05000,2.484
15,mlp.up_proj,0.0000739427,0.05000,2.506
15,mlp.down_proj,0.0000164698,0.05000,3.217
16,self_attn.qkv_proj,0.0001466132,0.05000,1.126
16,self_attn.o_proj,0.0000097625,0.05000,1.116
16,mlp.up_proj,0.0000786630,0.05000,2.562
16,mlp.gate_proj,0.0000699401,0.05000,2.584
16,mlp.down_proj,0.0000218803,0.05000,3.116
17,self_attn.qkv_proj,0.0001490546,0.05000,1.142
17,self_attn.o_proj,0.0000076505,0.05000,1.103
17,mlp.up_proj,0.0000841039,0.05000,2.591
17,mlp.gate_proj,0.0000739672,0.05000,2.615
17,mlp.down_proj,0.0000262042,0.05000,3.182
18,self_attn.qkv_proj,0.0001470632,0.05000,1.166
18,self_attn.o_proj,0.0000125533,0.05000,1.141
18,mlp.up_proj,0.0000932287,0.05000,2.532
18,mlp.gate_proj,0.0000829974,0.05000,2.548
18,mlp.down_proj,0.0000385317,0.05000,3.301
19,self_attn.qkv_proj,0.0001654606,0.05000,1.171
19,self_attn.o_proj,0.0000149239,0.05000,1.165
19,mlp.up_proj,0.0000991290,0.05000,2.623
19,mlp.gate_proj,0.0000894585,0.05000,2.664
19,mlp.down_proj,0.0000435778,0.05000,3.377
20,self_attn.qkv_proj,0.0001578730,0.05000,1.156
20,self_attn.o_proj,0.0000184642,0.05000,1.195
20,mlp.up_proj,0.0001209617,0.05000,2.661
20,mlp.gate_proj,0.0001092768,0.05000,2.687
20,mlp.down_proj,0.0000563793,0.05000,3.294
21,self_attn.qkv_proj,0.0001870555,0.05000,1.213
21,self_attn.o_proj,0.0000136906,0.05000,1.101
21,mlp.gate_proj,0.0001159161,0.05000,2.587
21,mlp.up_proj,0.0001299713,0.05000,2.605
21,mlp.down_proj,0.0000704598,0.05000,3.190
22,self_attn.qkv_proj,0.0001782628,0.05000,1.132
22,self_attn.o_proj,0.0000249007,0.05000,1.132
22,mlp.up_proj,0.0001397206,0.05000,2.564
22,mlp.gate_proj,0.0001231925,0.05000,2.572
22,mlp.down_proj,0.0000832951,0.05000,3.299
23,self_attn.qkv_proj,0.0001967909,0.05000,1.156
23,self_attn.o_proj,0.0000105388,0.05000,1.119
23,mlp.gate_proj,0.0001326374,0.05000,2.511
23,mlp.up_proj,0.0001492243,0.05000,2.540
23,mlp.down_proj,0.0000830157,0.05000,3.201
24,self_attn.qkv_proj,0.0002110393,0.05000,1.125
24,self_attn.o_proj,0.0000124396,0.05000,1.090
24,mlp.up_proj,0.0001615396,0.05000,2.512
24,mlp.gate_proj,0.0001421848,0.05000,2.535
24,mlp.down_proj,0.0000963378,0.05000,3.219
25,self_attn.qkv_proj,0.0002265083,0.05000,1.141
25,self_attn.o_proj,0.0000209731,0.05000,1.112
25,mlp.gate_proj,0.0001558134,0.05000,2.658
25,mlp.up_proj,0.0001774229,0.05000,2.676
25,mlp.down_proj,0.0001089506,0.05000,3.236
26,self_attn.qkv_proj,0.0001990848,0.05000,1.134
26,self_attn.o_proj,0.0000347294,0.05000,1.136
26,mlp.up_proj,0.0001846280,0.05000,2.560
26,mlp.gate_proj,0.0001625094,0.05000,2.582
26,mlp.down_proj,0.0001322558,0.05000,3.308
27,self_attn.qkv_proj,0.0001973591,0.05000,1.118
27,self_attn.o_proj,0.0000244647,0.05000,1.148
27,mlp.gate_proj,0.0001797843,0.05000,2.541
27,mlp.up_proj,0.0002011022,0.05000,2.557
27,mlp.down_proj,0.0001692445,0.05000,3.208
28,self_attn.qkv_proj,0.0002489807,0.05000,1.203
28,self_attn.o_proj,0.0000308398,0.05000,1.119
28,mlp.up_proj,0.0002172940,0.05000,2.558
28,mlp.gate_proj,0.0002009149,0.05000,2.579
28,mlp.down_proj,0.0002246512,0.05000,3.171
29,self_attn.qkv_proj,0.0002247108,0.05000,1.150
29,self_attn.o_proj,0.0000370290,0.05000,1.123
29,mlp.gate_proj,0.0002232223,0.05000,2.595
29,mlp.up_proj,0.0002207740,0.05000,2.619
29,mlp.down_proj,0.0003816118,0.05000,3.237
30,self_attn.qkv_proj,0.0001591859,0.05000,1.131
30,self_attn.o_proj,0.0000362225,0.05000,1.087
30,mlp.gate_proj,0.0002359733,0.05000,2.611
30,mlp.up_proj,0.0002075650,0.05000,2.634
30,mlp.down_proj,0.0014728911,0.05000,3.272
31,self_attn.qkv_proj,0.0000035844,0.05000,1.131
31,self_attn.o_proj,0.0000039555,0.05000,1.124
31,mlp.gate_proj,0.0001033877,0.05000,2.621
31,mlp.up_proj,0.0000604577,0.05000,2.628
31,mlp.down_proj,0.0004907257,0.05000,3.331