File size: 7,379 Bytes
f09e7d3 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000036928,0.05000,1.790
0,self_attn.o_proj,0.0000001945,0.05000,1.331
0,mlp.up_proj,0.0000102390,0.05000,2.562
0,mlp.gate_proj,0.0000106993,0.05000,2.597
0,mlp.down_proj,0.0000007873,0.05000,3.140
1,self_attn.qkv_proj,0.0000288658,0.05000,1.350
1,self_attn.o_proj,0.0000003944,0.05000,1.314
1,mlp.up_proj,0.0000151884,0.05000,3.192
1,mlp.gate_proj,0.0000162423,0.05000,3.248
1,mlp.down_proj,0.0000017862,0.05000,3.335
2,self_attn.qkv_proj,0.0000672307,0.05000,1.265
2,self_attn.o_proj,0.0000004262,0.05000,1.162
2,mlp.up_proj,0.0000219007,0.05000,2.728
2,mlp.gate_proj,0.0000236388,0.05000,2.739
2,mlp.down_proj,0.0000015235,0.05000,3.191
3,self_attn.qkv_proj,0.0000958284,0.05000,1.113
3,self_attn.o_proj,0.0000007994,0.05000,1.071
3,mlp.gate_proj,0.0000320000,0.05000,2.401
3,mlp.up_proj,0.0000289537,0.05000,2.435
3,mlp.down_proj,0.0003337474,0.05000,3.272
4,self_attn.qkv_proj,0.0000909789,0.05000,1.106
4,self_attn.o_proj,0.0000012312,0.05000,1.100
4,mlp.up_proj,0.0000345329,0.05000,2.538
4,mlp.gate_proj,0.0000400292,0.05000,2.554
4,mlp.down_proj,0.0000039765,0.05000,3.210
5,self_attn.qkv_proj,0.0001159516,0.05000,1.133
5,self_attn.o_proj,0.0000017395,0.05000,1.128
5,mlp.up_proj,0.0000430088,0.05000,2.448
5,mlp.gate_proj,0.0000509520,0.05000,2.467
5,mlp.down_proj,0.0000057463,0.05000,3.189
6,self_attn.qkv_proj,0.0000961327,0.05000,1.115
6,self_attn.o_proj,0.0000022428,0.05000,1.125
6,mlp.up_proj,0.0000430322,0.05000,2.552
6,mlp.gate_proj,0.0000487083,0.05000,2.587
6,mlp.down_proj,0.0000063000,0.05000,3.109
7,self_attn.qkv_proj,0.0001434261,0.05000,1.093
7,self_attn.o_proj,0.0000029053,0.05000,1.076
7,mlp.up_proj,0.0000461718,0.05000,2.553
7,mlp.gate_proj,0.0000501546,0.05000,2.579
7,mlp.down_proj,0.0000080737,0.05000,3.201
8,self_attn.qkv_proj,0.0001350463,0.05000,1.091
8,self_attn.o_proj,0.0000040604,0.05000,1.109
8,mlp.up_proj,0.0000482156,0.05000,2.403
8,mlp.gate_proj,0.0000492231,0.05000,2.431
8,mlp.down_proj,0.0000089525,0.05000,3.215
9,self_attn.qkv_proj,0.0001197565,0.05000,1.137
9,self_attn.o_proj,0.0000039595,0.05000,1.111
9,mlp.up_proj,0.0000522804,0.05000,2.498
9,mlp.gate_proj,0.0000520745,0.05000,2.531
9,mlp.down_proj,0.0000084691,0.05000,3.158
10,self_attn.qkv_proj,0.0001285350,0.05000,1.141
10,self_attn.o_proj,0.0000056212,0.05000,1.134
10,mlp.up_proj,0.0000538686,0.05000,2.537
10,mlp.gate_proj,0.0000539127,0.05000,2.535
10,mlp.down_proj,0.0000092388,0.05000,3.212
11,self_attn.qkv_proj,0.0001265468,0.05000,1.102
11,self_attn.o_proj,0.0000049263,0.05000,1.106
11,mlp.up_proj,0.0000561754,0.05000,2.543
11,mlp.gate_proj,0.0000538750,0.05000,2.569
11,mlp.down_proj,0.0000098257,0.05000,3.231
12,self_attn.qkv_proj,0.0001307771,0.05000,1.150
12,self_attn.o_proj,0.0000049451,0.05000,1.125
12,mlp.gate_proj,0.0000524987,0.05000,2.460
12,mlp.up_proj,0.0000571596,0.05000,2.484
12,mlp.down_proj,0.0000116566,0.05000,3.190
13,self_attn.qkv_proj,0.0001563531,0.05000,1.108
13,self_attn.o_proj,0.0000065090,0.05000,1.103
13,mlp.up_proj,0.0000612276,0.05000,2.490
13,mlp.gate_proj,0.0000543759,0.05000,2.508
13,mlp.down_proj,0.0000127317,0.05000,3.187
14,self_attn.qkv_proj,0.0001393042,0.05000,1.131
14,self_attn.o_proj,0.0000061571,0.05000,1.116
14,mlp.gate_proj,0.0000600704,0.05000,2.562
14,mlp.up_proj,0.0000672100,0.05000,2.584
14,mlp.down_proj,0.0000145146,0.05000,3.154
15,self_attn.qkv_proj,0.0001545983,0.05000,1.100
15,self_attn.o_proj,0.0000057894,0.05000,1.103
15,mlp.gate_proj,0.0000662487,0.05000,2.484
15,mlp.up_proj,0.0000739427,0.05000,2.506
15,mlp.down_proj,0.0000164698,0.05000,3.217
16,self_attn.qkv_proj,0.0001466132,0.05000,1.126
16,self_attn.o_proj,0.0000097625,0.05000,1.116
16,mlp.up_proj,0.0000786630,0.05000,2.562
16,mlp.gate_proj,0.0000699401,0.05000,2.584
16,mlp.down_proj,0.0000218803,0.05000,3.116
17,self_attn.qkv_proj,0.0001490546,0.05000,1.142
17,self_attn.o_proj,0.0000076505,0.05000,1.103
17,mlp.up_proj,0.0000841039,0.05000,2.591
17,mlp.gate_proj,0.0000739672,0.05000,2.615
17,mlp.down_proj,0.0000262042,0.05000,3.182
18,self_attn.qkv_proj,0.0001470632,0.05000,1.166
18,self_attn.o_proj,0.0000125533,0.05000,1.141
18,mlp.up_proj,0.0000932287,0.05000,2.532
18,mlp.gate_proj,0.0000829974,0.05000,2.548
18,mlp.down_proj,0.0000385317,0.05000,3.301
19,self_attn.qkv_proj,0.0001654606,0.05000,1.171
19,self_attn.o_proj,0.0000149239,0.05000,1.165
19,mlp.up_proj,0.0000991290,0.05000,2.623
19,mlp.gate_proj,0.0000894585,0.05000,2.664
19,mlp.down_proj,0.0000435778,0.05000,3.377
20,self_attn.qkv_proj,0.0001578730,0.05000,1.156
20,self_attn.o_proj,0.0000184642,0.05000,1.195
20,mlp.up_proj,0.0001209617,0.05000,2.661
20,mlp.gate_proj,0.0001092768,0.05000,2.687
20,mlp.down_proj,0.0000563793,0.05000,3.294
21,self_attn.qkv_proj,0.0001870555,0.05000,1.213
21,self_attn.o_proj,0.0000136906,0.05000,1.101
21,mlp.gate_proj,0.0001159161,0.05000,2.587
21,mlp.up_proj,0.0001299713,0.05000,2.605
21,mlp.down_proj,0.0000704598,0.05000,3.190
22,self_attn.qkv_proj,0.0001782628,0.05000,1.132
22,self_attn.o_proj,0.0000249007,0.05000,1.132
22,mlp.up_proj,0.0001397206,0.05000,2.564
22,mlp.gate_proj,0.0001231925,0.05000,2.572
22,mlp.down_proj,0.0000832951,0.05000,3.299
23,self_attn.qkv_proj,0.0001967909,0.05000,1.156
23,self_attn.o_proj,0.0000105388,0.05000,1.119
23,mlp.gate_proj,0.0001326374,0.05000,2.511
23,mlp.up_proj,0.0001492243,0.05000,2.540
23,mlp.down_proj,0.0000830157,0.05000,3.201
24,self_attn.qkv_proj,0.0002110393,0.05000,1.125
24,self_attn.o_proj,0.0000124396,0.05000,1.090
24,mlp.up_proj,0.0001615396,0.05000,2.512
24,mlp.gate_proj,0.0001421848,0.05000,2.535
24,mlp.down_proj,0.0000963378,0.05000,3.219
25,self_attn.qkv_proj,0.0002265083,0.05000,1.141
25,self_attn.o_proj,0.0000209731,0.05000,1.112
25,mlp.gate_proj,0.0001558134,0.05000,2.658
25,mlp.up_proj,0.0001774229,0.05000,2.676
25,mlp.down_proj,0.0001089506,0.05000,3.236
26,self_attn.qkv_proj,0.0001990848,0.05000,1.134
26,self_attn.o_proj,0.0000347294,0.05000,1.136
26,mlp.up_proj,0.0001846280,0.05000,2.560
26,mlp.gate_proj,0.0001625094,0.05000,2.582
26,mlp.down_proj,0.0001322558,0.05000,3.308
27,self_attn.qkv_proj,0.0001973591,0.05000,1.118
27,self_attn.o_proj,0.0000244647,0.05000,1.148
27,mlp.gate_proj,0.0001797843,0.05000,2.541
27,mlp.up_proj,0.0002011022,0.05000,2.557
27,mlp.down_proj,0.0001692445,0.05000,3.208
28,self_attn.qkv_proj,0.0002489807,0.05000,1.203
28,self_attn.o_proj,0.0000308398,0.05000,1.119
28,mlp.up_proj,0.0002172940,0.05000,2.558
28,mlp.gate_proj,0.0002009149,0.05000,2.579
28,mlp.down_proj,0.0002246512,0.05000,3.171
29,self_attn.qkv_proj,0.0002247108,0.05000,1.150
29,self_attn.o_proj,0.0000370290,0.05000,1.123
29,mlp.gate_proj,0.0002232223,0.05000,2.595
29,mlp.up_proj,0.0002207740,0.05000,2.619
29,mlp.down_proj,0.0003816118,0.05000,3.237
30,self_attn.qkv_proj,0.0001591859,0.05000,1.131
30,self_attn.o_proj,0.0000362225,0.05000,1.087
30,mlp.gate_proj,0.0002359733,0.05000,2.611
30,mlp.up_proj,0.0002075650,0.05000,2.634
30,mlp.down_proj,0.0014728911,0.05000,3.272
31,self_attn.qkv_proj,0.0000035844,0.05000,1.131
31,self_attn.o_proj,0.0000039555,0.05000,1.124
31,mlp.gate_proj,0.0001033877,0.05000,2.621
31,mlp.up_proj,0.0000604577,0.05000,2.628
31,mlp.down_proj,0.0004907257,0.05000,3.331
|