File size: 7,440 Bytes
ba242ea | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00268859,0.01000,2.297
0,self_attn.v_proj,0.00012146,0.01000,1.532
0,self_attn.q_proj,0.00339818,0.01000,1.401
0,self_attn.o_proj,0.00007466,0.01000,3.458
0,mlp.up_proj,0.00165959,0.01000,3.002
0,mlp.gate_proj,0.00176081,0.01000,2.685
0,mlp.down_proj,0.00171541,0.01000,19.171
1,self_attn.k_proj,0.00514033,0.01000,3.422
1,self_attn.v_proj,0.00119326,0.01000,3.608
1,self_attn.q_proj,0.00603395,0.01000,1.613
1,self_attn.o_proj,0.00048323,0.01000,3.834
1,mlp.up_proj,0.00365061,0.01000,1.590
1,mlp.gate_proj,0.00421130,0.01000,6.380
1,mlp.down_proj,0.02673751,0.01000,7.127
2,self_attn.k_proj,0.00933676,0.01000,1.540
2,self_attn.v_proj,0.00363998,0.01000,2.579
2,self_attn.q_proj,0.01070433,0.01000,3.024
2,self_attn.o_proj,0.00095308,0.01000,1.640
2,mlp.up_proj,0.00610160,0.01000,10.450
2,mlp.gate_proj,0.00684849,0.01000,3.323
2,mlp.down_proj,0.00416326,0.01000,11.194
3,self_attn.k_proj,0.01245183,0.01000,3.158
3,self_attn.v_proj,0.00521770,0.01000,3.034
3,self_attn.q_proj,0.01259811,0.01000,3.280
3,self_attn.o_proj,0.00154380,0.01000,8.060
3,mlp.up_proj,0.00826654,0.01000,1.420
3,mlp.gate_proj,0.00868698,0.01000,1.575
3,mlp.down_proj,0.00818474,0.01000,12.702
4,self_attn.k_proj,0.01399883,0.01000,2.538
4,self_attn.v_proj,0.00609351,0.01000,9.978
4,self_attn.q_proj,0.01455349,0.01000,4.893
4,self_attn.o_proj,0.00308353,0.01000,1.867
4,mlp.up_proj,0.01101172,0.01000,1.507
4,mlp.gate_proj,0.01136096,0.01000,3.298
4,mlp.down_proj,0.01204515,0.01000,11.278
5,self_attn.k_proj,0.01381846,0.01000,5.158
5,self_attn.v_proj,0.00638836,0.01000,1.610
5,self_attn.q_proj,0.01450016,0.01000,1.798
5,self_attn.o_proj,0.00360254,0.01000,1.624
5,mlp.up_proj,0.01348488,0.01000,4.580
5,mlp.gate_proj,0.01340446,0.01000,1.761
5,mlp.down_proj,0.01536761,0.01000,22.166
6,self_attn.k_proj,0.01536616,0.01000,1.813
6,self_attn.v_proj,0.00765775,0.01000,1.057
6,self_attn.q_proj,0.01647044,0.01000,1.589
6,self_attn.o_proj,0.00484225,0.01000,1.817
6,mlp.up_proj,0.01586073,0.01000,2.670
6,mlp.gate_proj,0.01545403,0.01000,2.092
6,mlp.down_proj,0.01897714,0.01000,16.333
7,self_attn.k_proj,0.01551268,0.01000,2.392
7,self_attn.v_proj,0.00767670,0.01000,0.989
7,self_attn.q_proj,0.01955890,0.01000,2.897
7,self_attn.o_proj,0.00776187,0.01000,3.109
7,mlp.up_proj,0.02011534,0.01000,5.595
7,mlp.gate_proj,0.01881913,0.01000,8.879
7,mlp.down_proj,0.13795254,0.01000,5.252
8,self_attn.k_proj,0.01517920,0.01000,2.907
8,self_attn.v_proj,0.01077128,0.01000,3.195
8,self_attn.q_proj,0.01539815,0.01000,0.929
8,self_attn.o_proj,0.01244297,0.01000,8.706
8,mlp.up_proj,0.02336273,0.01000,1.006
8,mlp.gate_proj,0.02230725,0.01000,0.914
8,mlp.down_proj,0.03689886,0.01000,7.602
9,self_attn.k_proj,0.01419967,0.01000,3.176
9,self_attn.v_proj,0.00935659,0.01000,0.916
9,self_attn.q_proj,0.01437793,0.01000,7.752
9,self_attn.o_proj,0.01545753,0.01000,1.956
9,mlp.up_proj,0.02452471,0.01000,1.045
9,mlp.gate_proj,0.02163836,0.01000,0.934
9,mlp.down_proj,0.04093376,0.01000,8.590
10,self_attn.k_proj,0.01597095,0.01000,7.668
10,self_attn.v_proj,0.01030280,0.01000,0.955
10,self_attn.q_proj,0.01661386,0.01000,0.953
10,self_attn.o_proj,0.02046761,0.01000,0.961
10,mlp.up_proj,0.02449678,0.01000,1.783
10,mlp.gate_proj,0.02200876,0.01000,3.467
10,mlp.down_proj,0.04767245,0.01000,12.654
11,self_attn.k_proj,0.01583570,0.01000,0.988
11,self_attn.v_proj,0.01004474,0.01000,1.007
11,self_attn.q_proj,0.01681633,0.01000,0.953
11,self_attn.o_proj,0.02400013,0.01000,0.944
11,mlp.up_proj,0.02487121,0.01000,2.184
11,mlp.gate_proj,0.02244228,0.01000,0.996
11,mlp.down_proj,0.05173288,0.01000,18.105
12,self_attn.k_proj,0.01769731,0.01000,0.839
12,self_attn.v_proj,0.01472340,0.01000,0.551
12,self_attn.q_proj,0.01947594,0.01000,0.509
12,self_attn.o_proj,0.03308697,0.01000,0.642
12,mlp.up_proj,0.02705463,0.01000,0.573
12,mlp.gate_proj,0.02433215,0.01000,0.640
12,mlp.down_proj,0.06660484,0.01000,2.787
13,self_attn.k_proj,0.01724737,0.01000,0.509
13,self_attn.v_proj,0.01275570,0.01000,0.494
13,self_attn.q_proj,0.01846544,0.01000,0.557
13,self_attn.o_proj,0.02876754,0.01000,0.545
13,mlp.up_proj,0.02806181,0.01000,0.560
13,mlp.gate_proj,0.02527489,0.01000,0.524
13,mlp.down_proj,0.07755652,0.01000,2.416
14,self_attn.k_proj,0.01810676,0.01000,0.578
14,self_attn.v_proj,0.01431919,0.01000,0.505
14,self_attn.q_proj,0.01790303,0.01000,0.502
14,self_attn.o_proj,0.03729445,0.01000,0.527
14,mlp.up_proj,0.03043460,0.01000,0.550
14,mlp.gate_proj,0.02668553,0.01000,0.534
14,mlp.down_proj,0.10596363,0.01000,2.331
15,self_attn.k_proj,0.01930179,0.01000,0.515
15,self_attn.v_proj,0.02241649,0.01000,0.496
15,self_attn.q_proj,0.02011626,0.01000,0.497
15,self_attn.o_proj,0.05061907,0.01000,0.566
15,mlp.up_proj,0.03395730,0.01000,0.569
15,mlp.gate_proj,0.02911986,0.01000,0.593
15,mlp.down_proj,0.14194915,0.01000,2.274
16,self_attn.k_proj,0.02059570,0.01000,0.511
16,self_attn.v_proj,0.02086210,0.01000,0.496
16,self_attn.q_proj,0.02103812,0.01000,0.489
16,self_attn.o_proj,0.05604012,0.01000,0.514
16,mlp.up_proj,0.04187595,0.01000,0.539
16,mlp.gate_proj,0.03528344,0.01000,0.510
16,mlp.down_proj,0.21391028,0.01000,2.362
17,self_attn.k_proj,0.01972736,0.01000,0.528
17,self_attn.v_proj,0.02926025,0.01000,0.498
17,self_attn.q_proj,0.02005677,0.01000,0.498
17,self_attn.o_proj,0.09542210,0.01000,0.517
17,mlp.up_proj,0.04948561,0.01000,0.617
17,mlp.gate_proj,0.04208370,0.01000,0.527
17,mlp.down_proj,0.30404621,0.01000,2.336
18,self_attn.k_proj,0.01914989,0.01000,0.672
18,self_attn.v_proj,0.03310600,0.01000,0.540
18,self_attn.q_proj,0.02003000,0.01000,0.524
18,self_attn.o_proj,0.10906528,0.01000,0.543
18,mlp.up_proj,0.06152352,0.01000,0.530
18,mlp.gate_proj,0.05048580,0.01000,0.507
18,mlp.down_proj,0.47315487,0.01000,2.273
19,self_attn.k_proj,0.01988266,0.01000,0.521
19,self_attn.v_proj,0.04468218,0.01000,0.504
19,self_attn.q_proj,0.02098379,0.01000,0.499
19,self_attn.o_proj,0.11830558,0.01000,0.524
19,mlp.up_proj,0.07140406,0.01000,0.569
19,mlp.gate_proj,0.05682839,0.01000,0.516
19,mlp.down_proj,0.64388824,0.01000,2.303
20,self_attn.k_proj,0.01980521,0.01000,0.517
20,self_attn.v_proj,0.05296587,0.01000,0.492
20,self_attn.q_proj,0.02124322,0.01000,0.521
20,self_attn.o_proj,0.11964528,0.01000,0.517
20,mlp.up_proj,0.07959354,0.01000,0.533
20,mlp.gate_proj,0.06235816,0.01000,0.511
20,mlp.down_proj,0.80122459,0.01000,2.308
21,self_attn.k_proj,0.02273879,0.01000,0.526
21,self_attn.v_proj,0.06846954,0.01000,0.494
21,self_attn.q_proj,0.02335146,0.01000,0.498
21,self_attn.o_proj,0.21736440,0.01000,0.515
21,mlp.up_proj,0.09114946,0.01000,0.533
21,mlp.gate_proj,0.07021903,0.01000,0.509
21,mlp.down_proj,1.01436162,0.01000,2.285
22,self_attn.k_proj,0.02368175,0.01000,0.515
22,self_attn.v_proj,0.07183458,0.01000,0.500
22,self_attn.q_proj,0.02609063,0.01000,0.585
22,self_attn.o_proj,0.34090981,0.01000,0.516
22,mlp.up_proj,0.10087807,0.01000,0.555
22,mlp.gate_proj,0.07864191,0.01000,0.506
22,mlp.down_proj,1.41661644,0.01000,2.276
23,self_attn.k_proj,0.02159666,0.01000,0.523
23,self_attn.v_proj,0.08762348,0.01000,0.498
23,self_attn.q_proj,0.02072346,0.01000,0.494
23,self_attn.o_proj,0.76461768,0.01000,0.515
23,mlp.up_proj,0.09932031,0.01000,0.525
23,mlp.gate_proj,0.08260745,0.01000,0.506
23,mlp.down_proj,2.73030257,0.01000,2.283
|