File size: 8,680 Bytes
bb44350 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 |
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00034001,0.01000,0.702
0,self_attn.v_proj,0.00026275,0.01000,0.516
0,self_attn.q_proj,0.00078015,0.01000,0.472
0,self_attn.o_proj,0.00021305,0.01000,0.944
0,mlp.up_proj,0.00412678,0.01000,0.466
0,mlp.gate_proj,0.00822148,0.01000,0.479
0,mlp.down_proj,0.00023430,0.01000,1.461
1,self_attn.k_proj,0.00014082,0.01000,0.490
1,self_attn.v_proj,0.00013241,0.01000,0.586
1,self_attn.q_proj,0.00031780,0.01000,0.512
1,self_attn.o_proj,0.00004038,0.01000,1.020
1,mlp.up_proj,0.01444682,0.01000,0.496
1,mlp.gate_proj,0.04915192,0.01000,0.495
1,mlp.down_proj,0.00029908,0.01000,1.443
2,self_attn.k_proj,0.00026053,0.01000,0.468
2,self_attn.v_proj,0.00024813,0.01000,0.477
2,self_attn.q_proj,0.00060980,0.01000,0.515
2,self_attn.o_proj,0.00006841,0.01000,1.000
2,mlp.up_proj,0.01214469,0.01000,0.488
2,mlp.gate_proj,0.03373746,0.01000,0.526
2,mlp.down_proj,0.01297616,0.01000,1.444
3,self_attn.k_proj,0.00230989,0.01000,0.465
3,self_attn.v_proj,0.00233178,0.01000,0.470
3,self_attn.q_proj,0.00470302,0.01000,0.480
3,self_attn.o_proj,0.00012092,0.01000,1.027
3,mlp.up_proj,0.01660008,0.01000,0.603
3,mlp.gate_proj,0.04289370,0.01000,0.484
3,mlp.down_proj,0.00092249,0.01000,1.553
4,self_attn.k_proj,0.00206668,0.01000,0.468
4,self_attn.v_proj,0.00214147,0.01000,0.476
4,self_attn.q_proj,0.00418732,0.01000,-1.693
4,self_attn.o_proj,0.00030304,0.01000,0.958
4,mlp.up_proj,0.01767924,0.01000,0.577
4,mlp.gate_proj,0.04030780,0.01000,0.628
4,mlp.down_proj,0.00111819,0.01000,1.658
5,self_attn.k_proj,0.00309932,0.01000,0.472
5,self_attn.v_proj,0.00331202,0.01000,0.475
5,self_attn.q_proj,0.00744162,0.01000,0.474
5,self_attn.o_proj,0.00036463,0.01000,0.938
5,mlp.up_proj,0.01660982,0.01000,0.518
5,mlp.gate_proj,0.02776664,0.01000,0.543
5,mlp.down_proj,0.00127475,0.01000,1.419
6,self_attn.k_proj,0.00246792,0.01000,0.541
6,self_attn.v_proj,0.00227531,0.01000,0.496
6,self_attn.q_proj,0.00543098,0.01000,0.474
6,self_attn.o_proj,0.00031531,0.01000,0.913
6,mlp.up_proj,0.02119459,0.01000,0.491
6,mlp.gate_proj,0.03364027,0.01000,0.556
6,mlp.down_proj,0.00169318,0.01000,1.440
7,self_attn.k_proj,0.00427833,0.01000,0.467
7,self_attn.v_proj,0.00491385,0.01000,0.468
7,self_attn.q_proj,0.01039105,0.01000,0.461
7,self_attn.o_proj,0.00045247,0.01000,1.037
7,mlp.up_proj,0.02380912,0.01000,0.474
7,mlp.gate_proj,0.03846249,0.01000,0.477
7,mlp.down_proj,0.00207670,0.01000,1.418
8,self_attn.k_proj,0.00580886,0.01000,0.458
8,self_attn.v_proj,0.00546446,0.01000,0.457
8,self_attn.q_proj,0.01283393,0.01000,0.464
8,self_attn.o_proj,0.00049309,0.01000,0.930
8,mlp.up_proj,0.02529081,0.01000,0.506
8,mlp.gate_proj,0.03940681,0.01000,0.549
8,mlp.down_proj,0.00239061,0.01000,1.463
9,self_attn.k_proj,0.01022408,0.01000,0.466
9,self_attn.v_proj,0.01063569,0.01000,0.464
9,self_attn.q_proj,0.02464896,0.01000,0.456
9,self_attn.o_proj,0.00082228,0.01000,0.913
9,mlp.up_proj,0.02869781,0.01000,0.475
9,mlp.gate_proj,0.04569711,0.01000,0.495
9,mlp.down_proj,0.00334036,0.01000,1.488
10,self_attn.k_proj,0.00897335,0.01000,0.463
10,self_attn.v_proj,0.00938525,0.01000,0.476
10,self_attn.q_proj,0.02165450,0.01000,0.472
10,self_attn.o_proj,0.00080374,0.01000,0.915
10,mlp.up_proj,0.02908845,0.01000,0.459
10,mlp.gate_proj,0.04619259,0.01000,0.469
10,mlp.down_proj,0.00457235,0.01000,1.560
11,self_attn.k_proj,0.01702636,0.01000,0.470
11,self_attn.v_proj,0.01571462,0.01000,0.448
11,self_attn.q_proj,0.04408321,0.01000,0.460
11,self_attn.o_proj,0.00194463,0.01000,0.917
11,mlp.up_proj,0.02965630,0.01000,0.471
11,mlp.gate_proj,0.03877314,0.01000,0.465
11,mlp.down_proj,0.00576400,0.01000,-0.688
12,self_attn.k_proj,0.01535154,0.01000,0.461
12,self_attn.v_proj,0.01573815,0.01000,0.463
12,self_attn.q_proj,0.04120466,0.01000,0.464
12,self_attn.o_proj,0.00082521,0.01000,0.993
12,mlp.up_proj,0.02786373,0.01000,0.508
12,mlp.gate_proj,0.03390844,0.01000,0.500
12,mlp.down_proj,0.00530050,0.01000,1.504
13,self_attn.k_proj,0.01469768,0.01000,0.532
13,self_attn.v_proj,0.01746682,0.01000,0.644
13,self_attn.q_proj,0.04317660,0.01000,0.650
13,self_attn.o_proj,0.00115520,0.01000,0.997
13,mlp.up_proj,0.02967896,0.01000,0.475
13,mlp.gate_proj,0.03677811,0.01000,0.458
13,mlp.down_proj,0.00540835,0.01000,1.386
14,self_attn.k_proj,0.01980565,0.01000,0.452
14,self_attn.v_proj,0.02136633,0.01000,0.458
14,self_attn.q_proj,0.05437878,0.01000,0.463
14,self_attn.o_proj,0.00118582,0.01000,0.909
14,mlp.up_proj,0.03194932,0.01000,0.581
14,mlp.gate_proj,0.03921878,0.01000,0.569
14,mlp.down_proj,0.00719125,0.01000,1.398
15,self_attn.k_proj,0.03463616,0.01000,0.614
15,self_attn.v_proj,0.04363632,0.01000,0.560
15,self_attn.q_proj,0.10855717,0.01000,0.587
15,self_attn.o_proj,0.00174209,0.01000,1.039
15,mlp.up_proj,0.03514949,0.01000,0.517
15,mlp.gate_proj,0.04189382,0.01000,0.461
15,mlp.down_proj,0.00778224,0.01000,1.585
16,self_attn.k_proj,0.05131978,0.01000,0.457
16,self_attn.v_proj,0.04501638,0.01000,0.453
16,self_attn.q_proj,0.13748899,0.01000,0.460
16,self_attn.o_proj,0.00201723,0.01000,0.920
16,mlp.up_proj,0.04067000,0.01000,0.425
16,mlp.gate_proj,0.04500043,0.01000,0.482
16,mlp.down_proj,0.01533213,0.01000,-0.971
17,self_attn.k_proj,0.10121436,0.01000,0.362
17,self_attn.v_proj,0.12345707,0.01000,0.434
17,self_attn.q_proj,0.30684415,0.01000,0.469
17,self_attn.o_proj,0.00474120,0.01000,0.883
17,mlp.up_proj,0.05722951,0.01000,0.361
17,mlp.gate_proj,0.06477357,0.01000,0.368
17,mlp.down_proj,0.01754329,0.01000,1.108
18,self_attn.k_proj,0.09428492,0.01000,0.359
18,self_attn.v_proj,0.10053023,0.01000,-1.804
18,self_attn.q_proj,0.29437009,0.01000,0.374
18,self_attn.o_proj,0.00352678,0.01000,0.796
18,mlp.up_proj,0.06900685,0.01000,0.379
18,mlp.gate_proj,0.07904451,0.01000,0.397
18,mlp.down_proj,0.02755920,0.01000,1.105
19,self_attn.k_proj,0.16187871,0.01000,0.356
19,self_attn.v_proj,0.20003729,0.01000,0.351
19,self_attn.q_proj,0.52686477,0.01000,0.369
19,self_attn.o_proj,0.00656477,0.01000,0.893
19,mlp.up_proj,0.08853976,0.01000,0.449
19,mlp.gate_proj,0.08336402,0.01000,0.426
19,mlp.down_proj,0.05588865,0.01000,1.080
20,self_attn.k_proj,0.22524926,0.01000,-2.716
20,self_attn.v_proj,0.26741582,0.01000,0.359
20,self_attn.q_proj,0.65623856,0.01000,0.358
20,self_attn.o_proj,0.00873903,0.01000,0.703
20,mlp.up_proj,0.09712939,0.01000,0.365
20,mlp.gate_proj,0.08698984,0.01000,0.385
20,mlp.down_proj,0.06682739,0.01000,1.080
21,self_attn.k_proj,0.39126575,0.01000,0.358
21,self_attn.v_proj,0.50307965,0.01000,0.393
21,self_attn.q_proj,1.09633744,0.01000,0.364
21,self_attn.o_proj,0.01702069,0.01000,0.759
21,mlp.up_proj,0.11749193,0.01000,0.390
21,mlp.gate_proj,0.09473881,0.01000,0.367
21,mlp.down_proj,0.09391166,0.01000,1.339
22,self_attn.k_proj,0.42912284,0.01000,0.366
22,self_attn.v_proj,0.62853205,0.01000,0.363
22,self_attn.q_proj,1.13549972,0.01000,0.362
22,self_attn.o_proj,0.01342478,0.01000,0.734
22,mlp.up_proj,0.12709107,0.01000,0.371
22,mlp.gate_proj,0.10018895,0.01000,0.380
22,mlp.down_proj,0.10143830,0.01000,1.094
23,self_attn.k_proj,0.59195518,0.01000,0.474
23,self_attn.v_proj,0.68701136,0.01000,0.384
23,self_attn.q_proj,1.32605648,0.01000,0.414
23,self_attn.o_proj,0.01738492,0.01000,0.719
23,mlp.up_proj,0.14314744,0.01000,0.361
23,mlp.gate_proj,0.11007850,0.01000,0.408
23,mlp.down_proj,0.10754839,0.01000,1.478
24,self_attn.k_proj,1.00415301,0.01000,0.361
24,self_attn.v_proj,1.12105525,0.01000,0.355
24,self_attn.q_proj,2.56474996,0.01000,0.358
24,self_attn.o_proj,0.02551685,0.01000,0.712
24,mlp.up_proj,0.13545924,0.01000,0.408
24,mlp.gate_proj,0.10024798,0.01000,0.363
24,mlp.down_proj,0.10790002,0.01000,1.191
25,self_attn.k_proj,1.19017565,0.01000,0.356
25,self_attn.v_proj,1.88630354,0.01000,0.358
25,self_attn.q_proj,3.16219616,0.01000,0.353
25,self_attn.o_proj,0.03715168,0.01000,0.753
25,mlp.up_proj,0.13330801,0.01000,0.360
25,mlp.gate_proj,0.09387642,0.01000,0.368
25,mlp.down_proj,0.13108285,0.01000,1.079
26,self_attn.k_proj,1.18263948,0.01000,0.436
26,self_attn.v_proj,1.67280781,0.01000,0.470
26,self_attn.q_proj,3.34765911,0.01000,0.454
26,self_attn.o_proj,0.09499875,0.01000,0.728
26,mlp.up_proj,0.14457943,0.01000,0.355
26,mlp.gate_proj,0.10359854,0.01000,0.367
26,mlp.down_proj,0.20188543,0.01000,1.095
27,self_attn.k_proj,0.88096058,0.01000,0.350
27,self_attn.v_proj,1.04464459,0.01000,0.357
27,self_attn.q_proj,1.89896679,0.01000,0.349
27,self_attn.o_proj,0.05569953,0.01000,0.722
27,mlp.up_proj,0.25829488,0.01000,0.365
27,mlp.gate_proj,0.24046963,0.01000,0.367
27,mlp.down_proj,0.23538056,0.01000,1.094
|