yongqiang
Initialize this repo
81ea8f1
layer,module,loss,samples,damp,time
0,self_attn.q_proj,0.0000000157,0.01000,0.453
0,self_attn.k_proj,0.0000000070,0.01000,0.218
0,self_attn.v_proj,0.0000000055,0.01000,0.220
0,self_attn.o_proj,0.0000000039,0.01000,0.433
0,mlp.gate_proj,0.0000001457,0.01000,0.216
0,mlp.up_proj,0.0000000745,0.01000,0.215
0,mlp.down_proj,0.0000000050,0.01000,0.652
1,self_attn.q_proj,0.0000000056,0.01000,0.286
1,self_attn.k_proj,0.0000000025,0.01000,0.217
1,self_attn.v_proj,0.0000000024,0.01000,0.217
1,self_attn.o_proj,0.0000000010,0.01000,0.434
1,mlp.gate_proj,0.0000008918,0.01000,0.216
1,mlp.up_proj,0.0000002667,0.01000,0.216
1,mlp.down_proj,0.0000000066,0.01000,0.659
2,self_attn.q_proj,0.0000000110,0.01000,0.255
2,self_attn.k_proj,0.0000000047,0.01000,0.219
2,self_attn.v_proj,0.0000000046,0.01000,0.218
2,self_attn.o_proj,0.0000000016,0.01000,0.435
2,mlp.gate_proj,0.0000006115,0.01000,0.219
2,mlp.up_proj,0.0000002231,0.01000,0.218
2,mlp.down_proj,0.0000078325,0.01000,0.661
3,self_attn.q_proj,0.0000000868,0.01000,0.260
3,self_attn.k_proj,0.0000000421,0.01000,0.220
3,self_attn.v_proj,0.0000000429,0.01000,0.219
3,self_attn.o_proj,0.0000000023,0.01000,0.442
3,mlp.gate_proj,0.0000008147,0.01000,0.218
3,mlp.up_proj,0.0000003186,0.01000,0.218
3,mlp.down_proj,0.0000000175,0.01000,0.701
4,self_attn.q_proj,0.0000000812,0.01000,0.263
4,self_attn.k_proj,0.0000000383,0.01000,0.217
4,self_attn.v_proj,0.0000000410,0.01000,0.219
4,self_attn.o_proj,0.0000000053,0.01000,0.437
4,mlp.gate_proj,0.0000007532,0.01000,0.219
4,mlp.up_proj,0.0000003315,0.01000,0.218
4,mlp.down_proj,0.0000000219,0.01000,0.659
5,self_attn.q_proj,0.0000001455,0.01000,0.262
5,self_attn.k_proj,0.0000000597,0.01000,0.223
5,self_attn.v_proj,0.0000000636,0.01000,0.226
5,self_attn.o_proj,0.0000000076,0.01000,0.452
5,mlp.gate_proj,0.0000005187,0.01000,0.223
5,mlp.up_proj,0.0000003102,0.01000,0.218
5,mlp.down_proj,0.0000000246,0.01000,0.664
6,self_attn.q_proj,0.0000000990,0.01000,0.257
6,self_attn.k_proj,0.0000000439,0.01000,0.222
6,self_attn.v_proj,0.0000000422,0.01000,0.218
6,self_attn.o_proj,0.0000000059,0.01000,0.438
6,mlp.gate_proj,0.0000006165,0.01000,0.216
6,mlp.up_proj,0.0000003886,0.01000,0.216
6,mlp.down_proj,0.0000000316,0.01000,0.661
7,self_attn.q_proj,0.0000001937,0.01000,0.282
7,self_attn.k_proj,0.0000000798,0.01000,0.249
7,self_attn.v_proj,0.0000000900,0.01000,0.246
7,self_attn.o_proj,0.0000000101,0.01000,0.490
7,mlp.gate_proj,0.0000007165,0.01000,0.243
7,mlp.up_proj,0.0000004434,0.01000,0.243
7,mlp.down_proj,0.0000000395,0.01000,0.700
8,self_attn.q_proj,0.0000002418,0.01000,0.257
8,self_attn.k_proj,0.0000001092,0.01000,0.221
8,self_attn.v_proj,0.0000001022,0.01000,0.217
8,self_attn.o_proj,0.0000000103,0.01000,0.435
8,mlp.gate_proj,0.0000007137,0.01000,0.218
8,mlp.up_proj,0.0000004578,0.01000,0.216
8,mlp.down_proj,0.0000000417,0.01000,0.659
9,self_attn.q_proj,0.0000004561,0.01000,0.291
9,self_attn.k_proj,0.0000001857,0.01000,0.219
9,self_attn.v_proj,0.0000001929,0.01000,0.221
9,self_attn.o_proj,0.0000000167,0.01000,0.439
9,mlp.gate_proj,0.0000007954,0.01000,0.220
9,mlp.up_proj,0.0000004992,0.01000,0.218
9,mlp.down_proj,0.0000000556,0.01000,0.661
10,self_attn.q_proj,0.0000003840,0.01000,0.289
10,self_attn.k_proj,0.0000001600,0.01000,0.220
10,self_attn.v_proj,0.0000001638,0.01000,0.220
10,self_attn.o_proj,0.0000000157,0.01000,0.446
10,mlp.gate_proj,0.0000008065,0.01000,0.221
10,mlp.up_proj,0.0000005084,0.01000,0.222
10,mlp.down_proj,0.0000000788,0.01000,0.671
11,self_attn.q_proj,0.0000008024,0.01000,0.283
11,self_attn.k_proj,0.0000003071,0.01000,0.239
11,self_attn.v_proj,0.0000002804,0.01000,0.220
11,self_attn.o_proj,0.0000000493,0.01000,0.443
11,mlp.gate_proj,0.0000006262,0.01000,0.220
11,mlp.up_proj,0.0000004808,0.01000,0.220
11,mlp.down_proj,0.0000000880,0.01000,0.668
12,self_attn.q_proj,0.0000007135,0.01000,0.266
12,self_attn.k_proj,0.0000002560,0.01000,0.218
12,self_attn.v_proj,0.0000002706,0.01000,0.215
12,self_attn.o_proj,0.0000000163,0.01000,0.443
12,mlp.gate_proj,0.0000005636,0.01000,0.215
12,mlp.up_proj,0.0000004659,0.01000,0.216
12,mlp.down_proj,0.0000000890,0.01000,0.659
13,self_attn.q_proj,0.0000007450,0.01000,0.255
13,self_attn.k_proj,0.0000002548,0.01000,0.215
13,self_attn.v_proj,0.0000002986,0.01000,0.215
13,self_attn.o_proj,0.0000000196,0.01000,0.432
13,mlp.gate_proj,0.0000006345,0.01000,0.214
13,mlp.up_proj,0.0000005136,0.01000,0.218
13,mlp.down_proj,0.0000000943,0.01000,0.656
14,self_attn.q_proj,0.0000010099,0.01000,0.258
14,self_attn.k_proj,0.0000003666,0.01000,0.215
14,self_attn.v_proj,0.0000003883,0.01000,0.215
14,self_attn.o_proj,0.0000000272,0.01000,0.435
14,mlp.gate_proj,0.0000006731,0.01000,0.215
14,mlp.up_proj,0.0000005531,0.01000,0.217
14,mlp.down_proj,0.0000001202,0.01000,0.653
15,self_attn.q_proj,0.0000019066,0.01000,0.286
15,self_attn.k_proj,0.0000005995,0.01000,0.218
15,self_attn.v_proj,0.0000007671,0.01000,0.215
15,self_attn.o_proj,0.0000000275,0.01000,0.434
15,mlp.gate_proj,0.0000007228,0.01000,0.215
15,mlp.up_proj,0.0000006042,0.01000,0.215
15,mlp.down_proj,0.0000001389,0.01000,0.656
16,self_attn.q_proj,0.0000023607,0.01000,0.288
16,self_attn.k_proj,0.0000008254,0.01000,0.216
16,self_attn.v_proj,0.0000007666,0.01000,0.215
16,self_attn.o_proj,0.0000000499,0.01000,0.436
16,mlp.gate_proj,0.0000007419,0.01000,0.213
16,mlp.up_proj,0.0000006750,0.01000,0.215
16,mlp.down_proj,0.0000002760,0.01000,0.653
17,self_attn.q_proj,0.0000051417,0.01000,0.286
17,self_attn.k_proj,0.0000016262,0.01000,0.216
17,self_attn.v_proj,0.0000019666,0.01000,0.215
17,self_attn.o_proj,0.0000001240,0.01000,0.433
17,mlp.gate_proj,0.0000010348,0.01000,0.216
17,mlp.up_proj,0.0000009428,0.01000,0.213
17,mlp.down_proj,0.0000003055,0.01000,0.656
18,self_attn.q_proj,0.0000046798,0.01000,0.266
18,self_attn.k_proj,0.0000014684,0.01000,0.216
18,self_attn.v_proj,0.0000017435,0.01000,0.216
18,self_attn.o_proj,0.0000000528,0.01000,0.432
18,mlp.gate_proj,0.0000011800,0.01000,0.214
18,mlp.up_proj,0.0000010920,0.01000,0.213
18,mlp.down_proj,0.0000005320,0.01000,0.651
19,self_attn.q_proj,0.0000081104,0.01000,0.262
19,self_attn.k_proj,0.0000023922,0.01000,0.216
19,self_attn.v_proj,0.0000029877,0.01000,0.215
19,self_attn.o_proj,0.0000001101,0.01000,0.433
19,mlp.gate_proj,0.0000012617,0.01000,0.214
19,mlp.up_proj,0.0000013705,0.01000,0.214
19,mlp.down_proj,0.0000010956,0.01000,0.654
20,self_attn.q_proj,0.0000104670,0.01000,0.278
20,self_attn.k_proj,0.0000034022,0.01000,0.243
20,self_attn.v_proj,0.0000042421,0.01000,0.243
20,self_attn.o_proj,0.0000001907,0.01000,0.493
20,mlp.gate_proj,0.0000013812,0.01000,0.242
20,mlp.up_proj,0.0000015767,0.01000,0.242
20,mlp.down_proj,0.0000016353,0.01000,0.748
21,self_attn.q_proj,0.0000185475,0.01000,0.276
21,self_attn.k_proj,0.0000059908,0.01000,0.242
21,self_attn.v_proj,0.0000075683,0.01000,0.242
21,self_attn.o_proj,0.0000003463,0.01000,0.487
21,mlp.gate_proj,0.0000014603,0.01000,0.239
21,mlp.up_proj,0.0000018684,0.01000,0.239
21,mlp.down_proj,0.0000023298,0.01000,0.744
22,self_attn.q_proj,0.0000192655,0.01000,0.280
22,self_attn.k_proj,0.0000066621,0.01000,0.248
22,self_attn.v_proj,0.0000090980,0.01000,0.250
22,self_attn.o_proj,0.0000002642,0.01000,0.503
22,mlp.gate_proj,0.0000016697,0.01000,0.243
22,mlp.up_proj,0.0000021728,0.01000,0.240
22,mlp.down_proj,0.0000026377,0.01000,0.750
23,self_attn.q_proj,0.0000223355,0.01000,0.282
23,self_attn.k_proj,0.0000091246,0.01000,0.251
23,self_attn.v_proj,0.0000111566,0.01000,0.250
23,self_attn.o_proj,0.0000002412,0.01000,0.487
23,mlp.gate_proj,0.0000018961,0.01000,0.243
23,mlp.up_proj,0.0000025225,0.01000,0.239
23,mlp.down_proj,0.0000023748,0.01000,0.733
24,self_attn.q_proj,0.0000478594,0.01000,0.277
24,self_attn.k_proj,0.0000162195,0.01000,0.244
24,self_attn.v_proj,0.0000187105,0.01000,0.244
24,self_attn.o_proj,0.0000003140,0.01000,0.490
24,mlp.gate_proj,0.0000018491,0.01000,0.242
24,mlp.up_proj,0.0000025646,0.01000,0.241
24,mlp.down_proj,0.0000022875,0.01000,0.743
25,self_attn.q_proj,0.0000736474,0.01000,0.261
25,self_attn.k_proj,0.0000219495,0.01000,0.218
25,self_attn.v_proj,0.0000348672,0.01000,0.220
25,self_attn.o_proj,0.0000005398,0.01000,0.441
25,mlp.gate_proj,0.0000018458,0.01000,0.217
25,mlp.up_proj,0.0000026985,0.01000,0.217
25,mlp.down_proj,0.0000027734,0.01000,0.647
26,self_attn.q_proj,0.0000973767,0.01000,0.251
26,self_attn.k_proj,0.0000243580,0.01000,0.241
26,self_attn.v_proj,0.0000364561,0.01000,0.243
26,self_attn.o_proj,0.0000044389,0.01000,0.485
26,mlp.gate_proj,0.0000018377,0.01000,0.240
26,mlp.up_proj,0.0000026512,0.01000,0.246
26,mlp.down_proj,0.0000062773,0.01000,0.744
27,self_attn.q_proj,0.0000334389,0.01000,0.290
27,self_attn.k_proj,0.0000149378,0.01000,0.243
27,self_attn.v_proj,0.0000184760,0.01000,0.243
27,self_attn.o_proj,0.0000022290,0.01000,0.489
27,mlp.gate_proj,0.0000068754,0.01000,0.242
27,mlp.up_proj,0.0000081715,0.01000,0.240
27,mlp.down_proj,0.0000067090,0.01000,0.735