File size: 7,490 Bytes
fb8ba82 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.77682245,0.01000,1.285
0,self_attn.v_proj,0.03500944,0.01000,0.555
0,self_attn.q_proj,0.99208140,0.01000,0.586
0,self_attn.o_proj,0.02151467,0.01000,0.622
0,mlp.up_proj,0.48560226,0.01000,0.688
0,mlp.gate_proj,0.51454079,0.01000,0.684
0,mlp.down_proj,0.50206679,0.01000,2.690
1,self_attn.k_proj,1.51786375,0.01000,0.619
1,self_attn.v_proj,0.34056193,0.01000,0.603
1,self_attn.q_proj,1.77233434,0.01000,0.599
1,self_attn.o_proj,0.13850473,0.01000,0.699
1,mlp.up_proj,1.10941112,0.01000,0.641
1,mlp.gate_proj,1.28043342,0.01000,0.611
1,mlp.down_proj,14.51999855,0.01000,2.696
2,self_attn.k_proj,2.82318068,0.01000,0.617
2,self_attn.v_proj,1.09324777,0.01000,0.582
2,self_attn.q_proj,3.20169973,0.01000,0.566
2,self_attn.o_proj,0.28864872,0.01000,0.662
2,mlp.up_proj,1.84167004,0.01000,0.590
2,mlp.gate_proj,2.07128930,0.01000,0.559
2,mlp.down_proj,1.27372789,0.01000,2.587
3,self_attn.k_proj,3.76621532,0.01000,0.643
3,self_attn.v_proj,1.56358862,0.01000,0.610
3,self_attn.q_proj,3.76481605,0.01000,0.616
3,self_attn.o_proj,0.44352189,0.01000,0.647
3,mlp.up_proj,2.52457261,0.01000,0.603
3,mlp.gate_proj,2.64974737,0.01000,0.623
3,mlp.down_proj,2.54826880,0.01000,2.554
4,self_attn.k_proj,4.20260096,0.01000,0.540
4,self_attn.v_proj,1.82544005,0.01000,0.488
4,self_attn.q_proj,4.33011675,0.01000,0.489
4,self_attn.o_proj,0.81763673,0.01000,0.535
4,mlp.up_proj,3.34401894,0.01000,0.512
4,mlp.gate_proj,3.44722080,0.01000,0.494
4,mlp.down_proj,3.73280597,0.01000,2.436
5,self_attn.k_proj,4.16551399,0.01000,0.610
5,self_attn.v_proj,1.92370594,0.01000,0.588
5,self_attn.q_proj,4.34254456,0.01000,0.635
5,self_attn.o_proj,0.96646106,0.01000,0.586
5,mlp.up_proj,4.14636469,0.01000,0.603
5,mlp.gate_proj,4.12169456,0.01000,0.585
5,mlp.down_proj,4.96067905,0.01000,2.481
6,self_attn.k_proj,4.64315891,0.01000,0.489
6,self_attn.v_proj,2.31881714,0.01000,0.467
6,self_attn.q_proj,4.96351624,0.01000,0.477
6,self_attn.o_proj,1.36653817,0.01000,0.526
6,mlp.up_proj,4.88970184,0.01000,0.503
6,mlp.gate_proj,4.76923084,0.01000,0.486
6,mlp.down_proj,6.02524185,0.01000,2.185
7,self_attn.k_proj,4.66848373,0.01000,0.489
7,self_attn.v_proj,2.31519604,0.01000,0.464
7,self_attn.q_proj,5.79233074,0.01000,0.480
7,self_attn.o_proj,2.15676284,0.01000,0.488
7,mlp.up_proj,6.20312214,0.01000,0.497
7,mlp.gate_proj,5.80423927,0.01000,0.483
7,mlp.down_proj,39.07165527,0.01000,2.213
8,self_attn.k_proj,4.63509369,0.01000,0.484
8,self_attn.v_proj,3.28440690,0.01000,0.523
8,self_attn.q_proj,4.71225929,0.01000,0.500
8,self_attn.o_proj,3.75382185,0.01000,0.488
8,mlp.up_proj,7.29536915,0.01000,0.504
8,mlp.gate_proj,6.96828270,0.01000,0.483
8,mlp.down_proj,11.49938583,0.01000,2.198
9,self_attn.k_proj,4.39791918,0.01000,0.498
9,self_attn.v_proj,2.88585830,0.01000,0.475
9,self_attn.q_proj,4.44140625,0.01000,0.489
9,self_attn.o_proj,4.38107252,0.01000,0.494
9,mlp.up_proj,7.57919312,0.01000,0.538
9,mlp.gate_proj,6.68407631,0.01000,0.484
9,mlp.down_proj,12.43455696,0.01000,2.212
10,self_attn.k_proj,4.90410137,0.01000,0.495
10,self_attn.v_proj,3.14827299,0.01000,0.476
10,self_attn.q_proj,5.09773064,0.01000,0.483
10,self_attn.o_proj,5.91220951,0.01000,0.493
10,mlp.up_proj,7.54940319,0.01000,0.522
10,mlp.gate_proj,6.77607632,0.01000,0.526
10,mlp.down_proj,14.59228039,0.01000,2.282
11,self_attn.k_proj,4.83724689,0.01000,0.495
11,self_attn.v_proj,3.04819179,0.01000,0.472
11,self_attn.q_proj,5.13493776,0.01000,0.481
11,self_attn.o_proj,6.75608921,0.01000,0.494
11,mlp.up_proj,7.71922398,0.01000,0.582
11,mlp.gate_proj,6.97108126,0.01000,0.491
11,mlp.down_proj,15.99707985,0.01000,2.207
12,self_attn.k_proj,5.48999071,0.01000,0.492
12,self_attn.v_proj,4.52012539,0.01000,0.469
12,self_attn.q_proj,5.99069595,0.01000,0.477
12,self_attn.o_proj,9.85486317,0.01000,0.488
12,mlp.up_proj,8.40734291,0.01000,0.503
12,mlp.gate_proj,7.56645966,0.01000,0.485
12,mlp.down_proj,21.01655579,0.01000,2.215
13,self_attn.k_proj,5.33678246,0.01000,0.491
13,self_attn.v_proj,3.92936134,0.01000,0.472
13,self_attn.q_proj,5.71902800,0.01000,0.480
13,self_attn.o_proj,8.64190197,0.01000,0.539
13,mlp.up_proj,8.67692661,0.01000,0.501
13,mlp.gate_proj,7.80695248,0.01000,0.502
13,mlp.down_proj,24.07814026,0.01000,2.222
14,self_attn.k_proj,5.57279205,0.01000,0.483
14,self_attn.v_proj,4.35658169,0.01000,0.476
14,self_attn.q_proj,5.51688099,0.01000,0.486
14,self_attn.o_proj,10.84986401,0.01000,0.490
14,mlp.up_proj,9.46220016,0.01000,0.509
14,mlp.gate_proj,8.29815006,0.01000,0.486
14,mlp.down_proj,33.66066742,0.01000,2.208
15,self_attn.k_proj,5.96792984,0.01000,0.489
15,self_attn.v_proj,6.85978556,0.01000,0.534
15,self_attn.q_proj,6.19756794,0.01000,0.491
15,self_attn.o_proj,15.63127327,0.01000,0.486
15,mlp.up_proj,10.45367622,0.01000,0.501
15,mlp.gate_proj,8.97001839,0.01000,0.478
15,mlp.down_proj,44.43462753,0.01000,2.187
16,self_attn.k_proj,6.45448399,0.01000,0.488
16,self_attn.v_proj,6.49105835,0.01000,0.468
16,self_attn.q_proj,6.57531500,0.01000,0.476
16,self_attn.o_proj,17.50428772,0.01000,0.486
16,mlp.up_proj,13.01940155,0.01000,0.512
16,mlp.gate_proj,10.95333672,0.01000,0.483
16,mlp.down_proj,66.79670715,0.01000,2.182
17,self_attn.k_proj,6.14941597,0.01000,0.485
17,self_attn.v_proj,8.96719837,0.01000,0.521
17,self_attn.q_proj,6.27163982,0.01000,0.532
17,self_attn.o_proj,30.05414200,0.01000,0.483
17,mlp.up_proj,15.46764755,0.01000,0.499
17,mlp.gate_proj,13.17247581,0.01000,0.478
17,mlp.down_proj,95.98254395,0.01000,2.191
18,self_attn.k_proj,5.98577356,0.01000,0.488
18,self_attn.v_proj,10.22346210,0.01000,0.468
18,self_attn.q_proj,6.29689360,0.01000,0.474
18,self_attn.o_proj,32.41912842,0.01000,0.481
18,mlp.up_proj,19.32838058,0.01000,0.565
18,mlp.gate_proj,15.88508987,0.01000,0.480
18,mlp.down_proj,148.66180420,0.01000,2.194
19,self_attn.k_proj,6.26510525,0.01000,0.487
19,self_attn.v_proj,13.85520744,0.01000,0.474
19,self_attn.q_proj,6.57017851,0.01000,0.473
19,self_attn.o_proj,35.20966721,0.01000,0.480
19,mlp.up_proj,22.48669624,0.01000,0.497
19,mlp.gate_proj,17.89473343,0.01000,0.481
19,mlp.down_proj,204.57714844,0.01000,2.171
20,self_attn.k_proj,6.23155594,0.01000,0.495
20,self_attn.v_proj,16.45906067,0.01000,0.476
20,self_attn.q_proj,6.64905834,0.01000,0.482
20,self_attn.o_proj,37.22135925,0.01000,0.502
20,mlp.up_proj,24.94277191,0.01000,0.501
20,mlp.gate_proj,19.56863976,0.01000,0.479
20,mlp.down_proj,253.60627747,0.01000,2.163
21,self_attn.k_proj,7.11655140,0.01000,0.485
21,self_attn.v_proj,21.37878990,0.01000,0.468
21,self_attn.q_proj,7.32550526,0.01000,0.471
21,self_attn.o_proj,64.90080261,0.01000,0.486
21,mlp.up_proj,28.40076065,0.01000,0.499
21,mlp.gate_proj,21.86407471,0.01000,0.476
21,mlp.down_proj,320.12417603,0.01000,2.247
22,self_attn.k_proj,7.32285166,0.01000,0.497
22,self_attn.v_proj,22.15027618,0.01000,0.473
22,self_attn.q_proj,8.15643311,0.01000,0.481
22,self_attn.o_proj,102.47914124,0.01000,0.485
22,mlp.up_proj,30.92877579,0.01000,0.504
22,mlp.gate_proj,24.13090897,0.01000,0.485
22,mlp.down_proj,418.65206909,0.01000,2.209
23,self_attn.k_proj,6.63460350,0.01000,0.489
23,self_attn.v_proj,26.71226501,0.01000,0.472
23,self_attn.q_proj,6.39267826,0.01000,0.481
23,self_attn.o_proj,234.22763062,0.01000,0.486
23,mlp.up_proj,31.12707901,0.01000,0.500
23,mlp.gate_proj,25.93458557,0.01000,0.479
23,mlp.down_proj,868.38049316,0.01000,2.240
|