viveksil's picture
Add files using upload-large-folder tool
a9d52d6 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.06256382,0.01000,0.912
0,self_attn.v_proj,0.00067420,0.01000,0.181
0,self_attn.q_proj,0.10552374,0.01000,0.178
0,self_attn.o_proj,0.00050934,0.01000,0.173
0,mlp.up_proj,0.43543735,0.01000,0.197
0,mlp.gate_proj,0.41209504,0.01000,0.183
0,mlp.down_proj,1.74956274,0.01000,0.472
1,self_attn.k_proj,0.23321666,0.01000,0.181
1,self_attn.v_proj,0.04265926,0.01000,0.175
1,self_attn.q_proj,0.50713903,0.01000,0.192
1,self_attn.o_proj,0.29871464,0.01000,0.172
1,mlp.up_proj,0.52259123,0.01000,0.167
1,mlp.gate_proj,0.66429782,0.01000,0.177
1,mlp.down_proj,0.65793574,0.01000,0.467
2,self_attn.k_proj,0.37111092,0.01000,0.184
2,self_attn.v_proj,0.05978241,0.01000,0.178
2,self_attn.q_proj,0.85819304,0.01000,0.172
2,self_attn.o_proj,0.27943617,0.01000,0.176
2,mlp.up_proj,0.69902754,0.01000,0.177
2,mlp.gate_proj,0.83238852,0.01000,0.175
2,mlp.down_proj,1.32616901,0.01000,0.479
3,self_attn.k_proj,0.53480613,0.01000,0.174
3,self_attn.v_proj,0.19553483,0.01000,0.183
3,self_attn.q_proj,1.33299196,0.01000,0.179
3,self_attn.o_proj,0.36493903,0.01000,0.173
3,mlp.up_proj,0.79671907,0.01000,0.182
3,mlp.gate_proj,0.90231085,0.01000,0.178
3,mlp.down_proj,0.99806905,0.01000,0.464
4,self_attn.k_proj,0.52328622,0.01000,0.178
4,self_attn.v_proj,0.19324306,0.01000,0.203
4,self_attn.q_proj,1.25000870,0.01000,0.218
4,self_attn.o_proj,0.50261188,0.01000,0.193
4,mlp.up_proj,1.04450798,0.01000,0.174
4,mlp.gate_proj,1.19090462,0.01000,0.175
4,mlp.down_proj,1.37261415,0.01000,0.549
5,self_attn.k_proj,0.56460476,0.01000,0.189
5,self_attn.v_proj,0.20564502,0.01000,0.189
5,self_attn.q_proj,1.31891513,0.01000,0.177
5,self_attn.o_proj,0.53682232,0.01000,0.181
5,mlp.up_proj,1.20378089,0.01000,0.180
5,mlp.gate_proj,1.32316709,0.01000,0.173
5,mlp.down_proj,1.63578343,0.01000,0.457
6,self_attn.k_proj,0.48800462,0.01000,0.193
6,self_attn.v_proj,0.19285259,0.01000,0.167
6,self_attn.q_proj,1.18869805,0.01000,0.178
6,self_attn.o_proj,0.56184769,0.01000,0.181
6,mlp.up_proj,1.28443360,0.01000,0.183
6,mlp.gate_proj,1.31438851,0.01000,0.192
6,mlp.down_proj,2.06012201,0.01000,0.485
7,self_attn.k_proj,0.66432202,0.01000,0.186
7,self_attn.v_proj,0.39548156,0.01000,0.172
7,self_attn.q_proj,1.84067345,0.01000,0.186
7,self_attn.o_proj,0.54949433,0.01000,0.180
7,mlp.up_proj,1.41139817,0.01000,0.194
7,mlp.gate_proj,1.39311254,0.01000,0.181
7,mlp.down_proj,2.45634985,0.01000,0.515
8,self_attn.k_proj,0.61689150,0.01000,0.178
8,self_attn.v_proj,0.29743513,0.01000,0.177
8,self_attn.q_proj,1.56349242,0.01000,0.166
8,self_attn.o_proj,0.80368316,0.01000,0.184
8,mlp.up_proj,1.61489773,0.01000,0.178
8,mlp.gate_proj,1.47358894,0.01000,0.181
8,mlp.down_proj,3.48785520,0.01000,0.462
9,self_attn.k_proj,0.42029348,0.01000,0.196
9,self_attn.v_proj,0.16713354,0.01000,0.198
9,self_attn.q_proj,1.14550853,0.01000,0.196
9,self_attn.o_proj,0.75486600,0.01000,0.175
9,mlp.up_proj,1.75040460,0.01000,0.175
9,mlp.gate_proj,1.44231176,0.01000,0.173
9,mlp.down_proj,4.26337147,0.01000,0.484
10,self_attn.k_proj,0.39127934,0.01000,0.178
10,self_attn.v_proj,0.19020256,0.01000,0.173
10,self_attn.q_proj,1.07599604,0.01000,0.184
10,self_attn.o_proj,1.62916851,0.01000,0.181
10,mlp.up_proj,1.79141831,0.01000,0.187
10,mlp.gate_proj,1.39241314,0.01000,0.172
10,mlp.down_proj,3.97726178,0.01000,0.472
11,self_attn.k_proj,0.33525729,0.01000,0.181
11,self_attn.v_proj,0.18537275,0.01000,0.171
11,self_attn.q_proj,1.01370001,0.01000,0.199
11,self_attn.o_proj,2.12376404,0.01000,0.180
11,mlp.up_proj,1.82445931,0.01000,0.183
11,mlp.gate_proj,1.32806182,0.01000,0.184
11,mlp.down_proj,186.60597229,0.01000,0.472
12,self_attn.k_proj,0.48405319,0.01000,0.172
12,self_attn.v_proj,0.25698844,0.01000,0.178
12,self_attn.q_proj,1.33479750,0.01000,0.189
12,self_attn.o_proj,1.04103160,0.01000,0.169
12,mlp.up_proj,1.66709638,0.01000,0.174
12,mlp.gate_proj,1.31850982,0.01000,0.168
12,mlp.down_proj,3.67623878,0.01000,0.459
13,self_attn.k_proj,0.52306521,0.01000,0.165
13,self_attn.v_proj,0.23163638,0.01000,0.193
13,self_attn.q_proj,1.48274660,0.01000,0.181
13,self_attn.o_proj,1.52564883,0.01000,0.161
13,mlp.up_proj,1.69629693,0.01000,0.176
13,mlp.gate_proj,1.56363511,0.01000,0.167
13,mlp.down_proj,3.77285790,0.01000,0.463
14,self_attn.k_proj,0.61791062,0.01000,0.176
14,self_attn.v_proj,0.45429951,0.01000,0.173
14,self_attn.q_proj,1.68052852,0.01000,0.186
14,self_attn.o_proj,2.28644967,0.01000,0.180
14,mlp.up_proj,1.72145450,0.01000,0.176
14,mlp.gate_proj,1.63012791,0.01000,0.172
14,mlp.down_proj,4.74705410,0.01000,0.470
15,self_attn.k_proj,0.57124710,0.01000,0.165
15,self_attn.v_proj,0.44042420,0.01000,0.166
15,self_attn.q_proj,1.67077899,0.01000,0.165
15,self_attn.o_proj,1.74314666,0.01000,0.167
15,mlp.up_proj,1.80302763,0.01000,0.164
15,mlp.gate_proj,1.79691231,0.01000,0.175
15,mlp.down_proj,5.59943199,0.01000,0.458
16,self_attn.k_proj,0.47524801,0.01000,0.232
16,self_attn.v_proj,0.32663453,0.01000,0.197
16,self_attn.q_proj,1.27558899,0.01000,0.157
16,self_attn.o_proj,2.69648743,0.01000,0.190
16,mlp.up_proj,1.65323758,0.01000,0.168
16,mlp.gate_proj,1.59195709,0.01000,0.162
16,mlp.down_proj,4.76000500,0.01000,0.431
17,self_attn.k_proj,0.71847141,0.01000,0.176
17,self_attn.v_proj,0.58196855,0.01000,0.170
17,self_attn.q_proj,2.49759388,0.01000,0.160
17,self_attn.o_proj,3.47188544,0.01000,0.151
17,mlp.up_proj,1.68230438,0.01000,0.155
17,mlp.gate_proj,1.51063716,0.01000,0.165
17,mlp.down_proj,5.52115583,0.01000,0.448
18,self_attn.k_proj,0.80530590,0.01000,0.157
18,self_attn.v_proj,0.92182064,0.01000,0.149
18,self_attn.q_proj,2.45034838,0.01000,0.155
18,self_attn.o_proj,3.25234222,0.01000,0.156
18,mlp.up_proj,1.84351170,0.01000,0.166
18,mlp.gate_proj,1.71802044,0.01000,0.168
18,mlp.down_proj,9.79771233,0.01000,0.443
19,self_attn.k_proj,0.39786786,0.01000,0.150
19,self_attn.v_proj,0.64931679,0.01000,0.146
19,self_attn.q_proj,1.62448215,0.01000,0.140
19,self_attn.o_proj,4.78523493,0.01000,0.148
19,mlp.up_proj,2.13052177,0.01000,0.148
19,mlp.gate_proj,2.01595855,0.01000,0.136
19,mlp.down_proj,9.97483063,0.01000,0.449
20,self_attn.k_proj,0.54920471,0.01000,0.161
20,self_attn.v_proj,1.10783672,0.01000,0.143
20,self_attn.q_proj,1.99741817,0.01000,0.163
20,self_attn.o_proj,4.60960484,0.01000,0.160
20,mlp.up_proj,2.55869007,0.01000,0.184
20,mlp.gate_proj,2.24854302,0.01000,0.232
20,mlp.down_proj,19.55944443,0.01000,0.590
21,self_attn.k_proj,0.50769174,0.01000,0.198
21,self_attn.v_proj,0.80476671,0.01000,0.192
21,self_attn.q_proj,1.79272270,0.01000,0.724
21,self_attn.o_proj,3.74716043,0.01000,0.232
21,mlp.up_proj,2.81642342,0.01000,0.233
21,mlp.gate_proj,2.56334019,0.01000,0.170
21,mlp.down_proj,15.52727795,0.01000,0.435
22,self_attn.k_proj,0.51919383,0.01000,0.197
22,self_attn.v_proj,0.89571881,0.01000,0.190
22,self_attn.q_proj,1.81653953,0.01000,0.165
22,self_attn.o_proj,5.18839121,0.01000,0.142
22,mlp.up_proj,3.13495636,0.01000,0.143
22,mlp.gate_proj,2.69524765,0.01000,0.148
22,mlp.down_proj,25.87879562,0.01000,0.433
23,self_attn.k_proj,0.69609213,0.01000,0.164
23,self_attn.v_proj,2.49952078,0.01000,0.157
23,self_attn.q_proj,2.21693826,0.01000,0.173
23,self_attn.o_proj,14.39114189,0.01000,0.158
23,mlp.up_proj,3.68463898,0.01000,0.171
23,mlp.gate_proj,2.83276129,0.01000,0.171
23,mlp.down_proj,28.22217178,0.01000,0.517
24,self_attn.k_proj,0.55973732,0.01000,0.162
24,self_attn.v_proj,2.60700345,0.01000,0.192
24,self_attn.q_proj,2.10726285,0.01000,0.162
24,self_attn.o_proj,7.63801670,0.01000,0.147
24,mlp.up_proj,3.54918289,0.01000,0.180
24,mlp.gate_proj,2.68827343,0.01000,0.169
24,mlp.down_proj,34.21448898,0.01000,0.428
25,self_attn.k_proj,0.52059758,0.01000,0.168
25,self_attn.v_proj,1.12329173,0.01000,0.161
25,self_attn.q_proj,1.77156615,0.01000,0.180
25,self_attn.o_proj,4.51467705,0.01000,0.153
25,mlp.up_proj,3.59808350,0.01000,0.161
25,mlp.gate_proj,2.82035089,0.01000,0.156
25,mlp.down_proj,27.07238770,0.01000,0.443
26,self_attn.k_proj,0.50036329,0.01000,0.157
26,self_attn.v_proj,1.58541822,0.01000,0.157
26,self_attn.q_proj,1.78324258,0.01000,0.161
26,self_attn.o_proj,6.87056065,0.01000,0.159
26,mlp.up_proj,4.04652023,0.01000,0.162
26,mlp.gate_proj,3.15157461,0.01000,0.161
26,mlp.down_proj,39.47451019,0.01000,0.504
27,self_attn.k_proj,0.49251500,0.01000,0.178
27,self_attn.v_proj,1.25342071,0.01000,0.153
27,self_attn.q_proj,1.81785595,0.01000,0.163
27,self_attn.o_proj,8.08690166,0.01000,0.155
27,mlp.up_proj,4.07105541,0.01000,0.174
27,mlp.gate_proj,2.98313332,0.01000,0.144
27,mlp.down_proj,50.69013214,0.01000,0.420
28,self_attn.k_proj,0.42138153,0.01000,0.154
28,self_attn.v_proj,1.60022080,0.01000,0.153
28,self_attn.q_proj,1.44547224,0.01000,0.151
28,self_attn.o_proj,7.02755356,0.01000,0.173
28,mlp.up_proj,4.30956984,0.01000,0.177
28,mlp.gate_proj,2.99873185,0.01000,0.157
28,mlp.down_proj,598.39166260,0.01000,0.427
29,self_attn.k_proj,0.39156410,0.01000,0.154
29,self_attn.v_proj,1.81828201,0.01000,0.157
29,self_attn.q_proj,1.65555286,0.01000,0.148
29,self_attn.o_proj,15.22791958,0.01000,0.213
29,mlp.up_proj,6.40628767,0.01000,0.168
29,mlp.gate_proj,4.79352283,0.01000,0.186
29,mlp.down_proj,229.68667603,0.01000,0.506