File size: 5,167 Bytes
23d2638 c2f2da4 23d2638 c2f2da4 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 | layer,module,loss,samples,damp,time
0,self_attn.v_proj,0.0000000385,0.01000,1.846
0,self_attn.k_proj,0.0000015441,0.01000,1.886
0,self_attn.q_proj,0.0000031392,0.01000,1.902
0,self_attn.o_proj,0.0000000037,0.01000,0.592
0,mlp.gate_proj,0.0000034816,0.01000,1.064
0,mlp.up_proj,0.0000027458,0.01000,1.101
0,mlp.down_proj,0.0000000218,0.01000,2.363
1,self_attn.k_proj,0.0000025944,0.01000,1.784
1,self_attn.v_proj,0.0000001495,0.01000,1.796
1,self_attn.q_proj,0.0000049469,0.01000,1.799
1,self_attn.o_proj,0.0000000131,0.01000,0.588
1,mlp.up_proj,0.0000038689,0.01000,1.032
1,mlp.gate_proj,0.0000053631,0.01000,1.068
1,mlp.down_proj,0.0000039940,0.01000,2.305
2,self_attn.v_proj,0.0000003579,0.01000,1.772
2,self_attn.q_proj,0.0000101736,0.01000,1.782
2,self_attn.k_proj,0.0000053271,0.01000,1.804
2,self_attn.o_proj,0.0000000173,0.01000,0.567
2,mlp.gate_proj,0.0000081035,0.01000,1.035
2,mlp.up_proj,0.0000049758,0.01000,1.035
2,mlp.down_proj,0.0000000698,0.01000,2.244
3,self_attn.v_proj,0.0000004568,0.01000,1.787
3,self_attn.q_proj,0.0000073714,0.01000,1.793
3,self_attn.k_proj,0.0000033302,0.01000,1.806
3,self_attn.o_proj,0.0000000331,0.01000,0.560
3,mlp.up_proj,0.0000060278,0.01000,1.064
3,mlp.gate_proj,0.0000124006,0.01000,1.108
3,mlp.down_proj,0.0000001048,0.01000,2.291
4,self_attn.q_proj,0.0000074171,0.01000,1.792
4,self_attn.k_proj,0.0000035654,0.01000,1.807
4,self_attn.v_proj,0.0000004238,0.01000,1.811
4,self_attn.o_proj,0.0000000512,0.01000,0.574
4,mlp.gate_proj,0.0000136872,0.01000,1.086
4,mlp.up_proj,0.0000060945,0.01000,1.123
4,mlp.down_proj,0.0000001183,0.01000,2.384
5,self_attn.k_proj,0.0000056526,0.01000,1.750
5,self_attn.q_proj,0.0000097203,0.01000,1.787
5,self_attn.v_proj,0.0000003722,0.01000,1.796
5,self_attn.o_proj,0.0000000521,0.01000,0.564
5,mlp.up_proj,0.0000065243,0.01000,1.095
5,mlp.gate_proj,0.0000125177,0.01000,1.095
5,mlp.down_proj,0.0000001387,0.01000,2.292
6,self_attn.k_proj,0.0000044023,0.01000,1.762
6,self_attn.v_proj,0.0000004759,0.01000,1.772
6,self_attn.q_proj,0.0000069243,0.01000,1.795
6,self_attn.o_proj,0.0000000774,0.01000,0.552
6,mlp.gate_proj,0.0000123539,0.01000,1.057
6,mlp.up_proj,0.0000065727,0.01000,1.100
6,mlp.down_proj,0.0000001390,0.01000,2.231
7,self_attn.k_proj,0.0000043861,0.01000,1.772
7,self_attn.v_proj,0.0000005450,0.01000,1.780
7,self_attn.q_proj,0.0000082903,0.01000,1.800
7,self_attn.o_proj,0.0000000725,0.01000,0.531
7,mlp.up_proj,0.0000068659,0.01000,1.067
7,mlp.gate_proj,0.0000115620,0.01000,1.102
7,mlp.down_proj,0.0000001555,0.01000,2.270
8,self_attn.k_proj,0.0000052875,0.01000,1.729
8,self_attn.v_proj,0.0000005141,0.01000,1.794
8,self_attn.q_proj,0.0000086041,0.01000,1.805
8,self_attn.o_proj,0.0000000941,0.01000,0.552
8,mlp.up_proj,0.0000076312,0.01000,1.017
8,mlp.gate_proj,0.0000125952,0.01000,1.054
8,mlp.down_proj,0.0000002089,0.01000,2.491
9,self_attn.v_proj,0.0000006379,0.01000,1.790
9,self_attn.k_proj,0.0000043032,0.01000,1.797
9,self_attn.q_proj,0.0000104725,0.01000,1.798
9,self_attn.o_proj,0.0000001270,0.01000,0.570
9,mlp.gate_proj,0.0000138218,0.01000,1.006
9,mlp.up_proj,0.0000081519,0.01000,1.043
9,mlp.down_proj,0.0000002536,0.01000,2.288
10,self_attn.k_proj,0.0000052919,0.01000,1.780
10,self_attn.v_proj,0.0000007385,0.01000,1.800
10,self_attn.q_proj,0.0000109618,0.01000,1.802
10,self_attn.o_proj,0.0000000904,0.01000,0.547
10,mlp.gate_proj,0.0000157324,0.01000,1.032
10,mlp.up_proj,0.0000096783,0.01000,1.032
10,mlp.down_proj,0.0000003206,0.01000,2.327
11,self_attn.q_proj,0.0000108013,0.01000,1.738
11,self_attn.v_proj,0.0000007318,0.01000,1.768
11,self_attn.k_proj,0.0000063929,0.01000,1.784
11,self_attn.o_proj,0.0000000737,0.01000,0.539
11,mlp.up_proj,0.0000107010,0.01000,1.055
11,mlp.gate_proj,0.0000169148,0.01000,1.092
11,mlp.down_proj,0.0000003495,0.01000,2.352
12,self_attn.q_proj,0.0000109646,0.01000,1.752
12,self_attn.v_proj,0.0000007339,0.01000,1.779
12,self_attn.k_proj,0.0000064957,0.01000,1.798
12,self_attn.o_proj,0.0000000729,0.01000,0.566
12,mlp.gate_proj,0.0000168436,0.01000,0.998
12,mlp.up_proj,0.0000114548,0.01000,1.038
12,mlp.down_proj,0.0000004103,0.01000,2.287
13,self_attn.k_proj,0.0000063991,0.01000,1.769
13,self_attn.v_proj,0.0000012767,0.01000,1.793
13,self_attn.q_proj,0.0000125225,0.01000,1.799
13,self_attn.o_proj,0.0000000978,0.01000,0.575
13,mlp.up_proj,0.0000132768,0.01000,1.011
13,mlp.gate_proj,0.0000178807,0.01000,1.046
13,mlp.down_proj,0.0000005930,0.01000,2.381
14,self_attn.k_proj,0.0000070746,0.01000,1.775
14,self_attn.q_proj,0.0000131299,0.01000,1.788
14,self_attn.v_proj,0.0000028588,0.01000,1.800
14,self_attn.o_proj,0.0000002135,0.01000,0.544
14,mlp.gate_proj,0.0000218060,0.01000,1.026
14,mlp.up_proj,0.0000150468,0.01000,1.066
14,mlp.down_proj,0.0000007873,0.01000,2.272
15,self_attn.v_proj,0.0000028172,0.01000,1.771
15,self_attn.k_proj,0.0000067497,0.01000,1.777
15,self_attn.q_proj,0.0000119015,0.01000,1.797
15,self_attn.o_proj,0.0000008570,0.01000,0.532
15,mlp.gate_proj,0.0000244674,0.01000,1.043
15,mlp.up_proj,0.0000183277,0.01000,1.079
15,mlp.down_proj,0.0000018268,0.01000,2.394
|