File size: 7,379 Bytes
ee77be3 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000033241,0.05000,1.466
0,self_attn.o_proj,0.0000001653,0.05000,0.972
0,mlp.up_proj,0.0000088873,0.05000,2.326
0,mlp.gate_proj,0.0000093133,0.05000,2.381
0,mlp.down_proj,0.0000006132,0.05000,2.897
1,self_attn.qkv_proj,0.0000256600,0.05000,1.133
1,self_attn.o_proj,0.0000002638,0.05000,1.190
1,mlp.up_proj,0.0000117479,0.05000,2.989
1,mlp.gate_proj,0.0000127222,0.05000,3.056
1,mlp.down_proj,0.0000011313,0.05000,2.995
2,self_attn.qkv_proj,0.0000549695,0.05000,1.098
2,self_attn.o_proj,0.0000003222,0.05000,1.060
2,mlp.up_proj,0.0000164835,0.05000,2.991
2,mlp.gate_proj,0.0000180576,0.05000,3.067
2,mlp.down_proj,0.0000009932,0.05000,2.948
3,self_attn.qkv_proj,0.0000797589,0.05000,1.024
3,self_attn.o_proj,0.0000005779,0.05000,1.035
3,mlp.gate_proj,0.0000227424,0.05000,2.564
3,mlp.up_proj,0.0000200395,0.05000,2.588
3,mlp.down_proj,0.0002782354,0.05000,2.898
4,self_attn.qkv_proj,0.0000732176,0.05000,1.017
4,self_attn.o_proj,0.0000009411,0.05000,1.014
4,mlp.gate_proj,0.0000293015,0.05000,2.410
4,mlp.up_proj,0.0000244080,0.05000,2.435
4,mlp.down_proj,0.0000023525,0.05000,2.982
5,self_attn.qkv_proj,0.0000933612,0.05000,1.026
5,self_attn.o_proj,0.0000017404,0.05000,1.043
5,mlp.gate_proj,0.0000357003,0.05000,2.498
5,mlp.up_proj,0.0000289614,0.05000,2.512
5,mlp.down_proj,0.0000036120,0.05000,2.905
6,self_attn.qkv_proj,0.0000769730,0.05000,1.034
6,self_attn.o_proj,0.0000019431,0.05000,0.999
6,mlp.gate_proj,0.0000366409,0.05000,2.308
6,mlp.up_proj,0.0000313463,0.05000,2.333
6,mlp.down_proj,0.0000043249,0.05000,2.952
7,self_attn.qkv_proj,0.0001243836,0.05000,1.054
7,self_attn.o_proj,0.0000031223,0.05000,1.024
7,mlp.up_proj,0.0000345948,0.05000,2.341
7,mlp.gate_proj,0.0000385413,0.05000,2.381
7,mlp.down_proj,0.0000056692,0.05000,2.957
8,self_attn.qkv_proj,0.0001220055,0.05000,1.034
8,self_attn.o_proj,0.0000041093,0.05000,1.017
8,mlp.up_proj,0.0000381113,0.05000,2.440
8,mlp.gate_proj,0.0000393560,0.05000,2.468
8,mlp.down_proj,0.0000063462,0.05000,2.941
9,self_attn.qkv_proj,0.0001055136,0.05000,1.018
9,self_attn.o_proj,0.0000038115,0.05000,1.023
9,mlp.up_proj,0.0000413347,0.05000,2.383
9,mlp.gate_proj,0.0000413403,0.05000,2.401
9,mlp.down_proj,0.0000060606,0.05000,2.969
10,self_attn.qkv_proj,0.0001138408,0.05000,1.028
10,self_attn.o_proj,0.0000050139,0.05000,1.026
10,mlp.up_proj,0.0000424914,0.05000,2.415
10,mlp.gate_proj,0.0000427714,0.05000,2.426
10,mlp.down_proj,0.0000062799,0.05000,3.024
11,self_attn.qkv_proj,0.0001136194,0.05000,1.025
11,self_attn.o_proj,0.0000053294,0.05000,1.033
11,mlp.gate_proj,0.0000435245,0.05000,2.301
11,mlp.up_proj,0.0000456607,0.05000,2.340
11,mlp.down_proj,0.0000071477,0.05000,2.955
12,self_attn.qkv_proj,0.0001161936,0.05000,1.074
12,self_attn.o_proj,0.0000050933,0.05000,1.018
12,mlp.gate_proj,0.0000425567,0.05000,2.328
12,mlp.up_proj,0.0000467951,0.05000,2.354
12,mlp.down_proj,0.0000079555,0.05000,2.941
13,self_attn.qkv_proj,0.0001463183,0.05000,1.023
13,self_attn.o_proj,0.0000080918,0.05000,1.013
13,mlp.up_proj,0.0000516755,0.05000,2.454
13,mlp.gate_proj,0.0000449235,0.05000,2.467
13,mlp.down_proj,0.0000089921,0.05000,2.883
14,self_attn.qkv_proj,0.0001305041,0.05000,1.017
14,self_attn.o_proj,0.0000074252,0.05000,1.019
14,mlp.gate_proj,0.0000498036,0.05000,2.374
14,mlp.up_proj,0.0000568754,0.05000,2.399
14,mlp.down_proj,0.0000102694,0.05000,2.953
15,self_attn.qkv_proj,0.0001450314,0.05000,1.016
15,self_attn.o_proj,0.0000070636,0.05000,1.018
15,mlp.gate_proj,0.0000541943,0.05000,2.286
15,mlp.up_proj,0.0000617730,0.05000,2.306
15,mlp.down_proj,0.0000115088,0.05000,2.977
16,self_attn.qkv_proj,0.0001367455,0.05000,1.021
16,self_attn.o_proj,0.0000106811,0.05000,1.077
16,mlp.gate_proj,0.0000558458,0.05000,2.282
16,mlp.up_proj,0.0000641705,0.05000,2.314
16,mlp.down_proj,0.0000146563,0.05000,2.944
17,self_attn.qkv_proj,0.0001290727,0.05000,1.030
17,self_attn.o_proj,0.0000075975,0.05000,1.049
17,mlp.gate_proj,0.0000583090,0.05000,2.453
17,mlp.up_proj,0.0000678901,0.05000,2.486
17,mlp.down_proj,0.0000175746,0.05000,2.974
18,self_attn.qkv_proj,0.0001274209,0.05000,1.018
18,self_attn.o_proj,0.0000124687,0.05000,1.052
18,mlp.up_proj,0.0000756719,0.05000,2.402
18,mlp.gate_proj,0.0000658952,0.05000,2.437
18,mlp.down_proj,0.0000258305,0.05000,2.968
19,self_attn.qkv_proj,0.0001435843,0.05000,1.026
19,self_attn.o_proj,0.0000158486,0.05000,1.022
19,mlp.up_proj,0.0000815260,0.05000,2.438
19,mlp.gate_proj,0.0000720414,0.05000,2.465
19,mlp.down_proj,0.0000294331,0.05000,2.928
20,self_attn.qkv_proj,0.0001412000,0.05000,1.041
20,self_attn.o_proj,0.0000198388,0.05000,1.020
20,mlp.gate_proj,0.0000866334,0.05000,2.407
20,mlp.up_proj,0.0000980211,0.05000,2.433
20,mlp.down_proj,0.0000357816,0.05000,2.969
21,self_attn.qkv_proj,0.0001619060,0.05000,1.030
21,self_attn.o_proj,0.0000168971,0.05000,1.010
21,mlp.gate_proj,0.0000912907,0.05000,2.397
21,mlp.up_proj,0.0001050032,0.05000,2.420
21,mlp.down_proj,0.0000443997,0.05000,2.936
22,self_attn.qkv_proj,0.0001537729,0.05000,1.016
22,self_attn.o_proj,0.0000249352,0.05000,1.006
22,mlp.up_proj,0.0001121257,0.05000,2.376
22,mlp.gate_proj,0.0000962384,0.05000,2.379
22,mlp.down_proj,0.0000494136,0.05000,2.923
23,self_attn.qkv_proj,0.0001589419,0.05000,1.051
23,self_attn.o_proj,0.0000104669,0.05000,1.009
23,mlp.gate_proj,0.0000999043,0.05000,2.438
23,mlp.up_proj,0.0001153954,0.05000,2.463
23,mlp.down_proj,0.0000453592,0.05000,2.927
24,self_attn.qkv_proj,0.0001645199,0.05000,1.031
24,self_attn.o_proj,0.0000096019,0.05000,1.021
24,mlp.up_proj,0.0001215475,0.05000,2.423
24,mlp.gate_proj,0.0001040655,0.05000,2.457
24,mlp.down_proj,0.0000538232,0.05000,2.972
25,self_attn.qkv_proj,0.0001800437,0.05000,1.046
25,self_attn.o_proj,0.0000219898,0.05000,1.034
25,mlp.up_proj,0.0001317978,0.05000,2.360
25,mlp.gate_proj,0.0001123926,0.05000,2.376
25,mlp.down_proj,0.0000615177,0.05000,3.004
26,self_attn.qkv_proj,0.0001578350,0.05000,1.045
26,self_attn.o_proj,0.0000382162,0.05000,1.019
26,mlp.up_proj,0.0001344800,0.05000,2.456
26,mlp.gate_proj,0.0001149784,0.05000,2.460
26,mlp.down_proj,0.0000757419,0.05000,2.945
27,self_attn.qkv_proj,0.0001475294,0.05000,1.035
27,self_attn.o_proj,0.0000206933,0.05000,1.017
27,mlp.up_proj,0.0001520072,0.05000,2.336
27,mlp.gate_proj,0.0001321883,0.05000,2.361
27,mlp.down_proj,0.0001098592,0.05000,2.962
28,self_attn.qkv_proj,0.0002010034,0.05000,1.035
28,self_attn.o_proj,0.0000312271,0.05000,1.009
28,mlp.gate_proj,0.0001526327,0.05000,2.282
28,mlp.up_proj,0.0001689870,0.05000,2.303
28,mlp.down_proj,0.0001587952,0.05000,2.939
29,self_attn.qkv_proj,0.0001802269,0.05000,1.036
29,self_attn.o_proj,0.0000341774,0.05000,1.013
29,mlp.gate_proj,0.0001712056,0.05000,2.437
29,mlp.up_proj,0.0001709735,0.05000,2.456
29,mlp.down_proj,0.0002735091,0.05000,2.917
30,self_attn.qkv_proj,0.0001263867,0.05000,1.014
30,self_attn.o_proj,0.0000344519,0.05000,1.018
30,mlp.up_proj,0.0001645436,0.05000,2.287
30,mlp.gate_proj,0.0001920412,0.05000,2.311
30,mlp.down_proj,0.0014165752,0.05000,2.951
31,self_attn.qkv_proj,0.0000026388,0.05000,1.010
31,self_attn.o_proj,0.0000037210,0.05000,1.014
31,mlp.up_proj,0.0000405552,0.05000,2.355
31,mlp.gate_proj,0.0000741658,0.05000,2.395
31,mlp.down_proj,0.0004612778,0.05000,2.959
|