File size: 6,025 Bytes
c2631e3 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 | layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.01193101,0.01000,0.799
0,self_attn.v_proj,0.00204742,0.01000,0.763
0,self_attn.q_proj,0.01151794,0.01000,0.777
0,self_attn.out_proj,0.00000999,0.01000,0.782
0,fc1,0.07026074,0.01000,0.789
0,fc2,0.00008938,0.01000,3.565
1,self_attn.k_proj,0.02562066,0.01000,0.818
1,self_attn.v_proj,0.00352371,0.01000,0.791
1,self_attn.q_proj,0.02841486,0.01000,0.810
1,self_attn.out_proj,0.00000083,0.01000,0.792
1,fc1,0.09863914,0.01000,0.803
1,fc2,0.00007210,0.01000,3.472
2,self_attn.k_proj,0.03177334,0.01000,0.804
2,self_attn.v_proj,0.00599721,0.01000,0.785
2,self_attn.q_proj,0.03215131,0.01000,0.795
2,self_attn.out_proj,0.00000170,0.01000,0.800
2,fc1,0.09993766,0.01000,0.805
2,fc2,0.00004340,0.01000,3.459
3,self_attn.k_proj,0.03017306,0.01000,0.800
3,self_attn.v_proj,0.00719706,0.01000,0.830
3,self_attn.q_proj,0.03313547,0.01000,0.796
3,self_attn.out_proj,0.00000379,0.01000,0.786
3,fc1,0.08670861,0.01000,0.824
3,fc2,0.00006025,0.01000,3.493
4,self_attn.k_proj,0.03740298,0.01000,0.821
4,self_attn.v_proj,0.00782993,0.01000,0.788
4,self_attn.q_proj,0.04022481,0.01000,0.796
4,self_attn.out_proj,0.00001067,0.01000,0.790
4,fc1,0.08439302,0.01000,0.812
4,fc2,0.00006476,0.01000,3.526
5,self_attn.k_proj,0.03982919,0.01000,0.839
5,self_attn.v_proj,0.00910398,0.01000,0.828
5,self_attn.q_proj,0.04431270,0.01000,0.832
5,self_attn.out_proj,0.00001022,0.01000,0.789
5,fc1,0.08609112,0.01000,0.800
5,fc2,0.00007743,0.01000,3.511
6,self_attn.k_proj,0.05780744,0.01000,0.851
6,self_attn.v_proj,0.01026140,0.01000,0.798
6,self_attn.q_proj,0.05580460,0.01000,0.802
6,self_attn.out_proj,0.00002657,0.01000,0.786
6,fc1,0.09354434,0.01000,0.804
6,fc2,0.00010447,0.01000,3.530
7,self_attn.k_proj,0.05912374,0.01000,0.805
7,self_attn.v_proj,0.01100888,0.01000,0.798
7,self_attn.q_proj,0.05362352,0.01000,0.791
7,self_attn.out_proj,0.00003713,0.01000,0.786
7,fc1,0.10488027,0.01000,0.802
7,fc2,0.00015386,0.01000,3.488
8,self_attn.k_proj,0.06267314,0.01000,0.811
8,self_attn.v_proj,0.01142946,0.01000,0.791
8,self_attn.q_proj,0.05168283,0.01000,0.808
8,self_attn.out_proj,0.00004905,0.01000,0.800
8,fc1,0.11440692,0.01000,0.800
8,fc2,0.00021658,0.01000,3.472
9,self_attn.k_proj,0.06292796,0.01000,0.807
9,self_attn.v_proj,0.01188188,0.01000,0.810
9,self_attn.q_proj,0.05260397,0.01000,0.823
9,self_attn.out_proj,0.00007306,0.01000,0.800
9,fc1,0.11874346,0.01000,0.803
9,fc2,0.00030846,0.01000,3.499
10,self_attn.k_proj,0.05970397,0.01000,0.839
10,self_attn.v_proj,0.01365755,0.01000,0.782
10,self_attn.q_proj,0.04870038,0.01000,0.787
10,self_attn.out_proj,0.00009548,0.01000,0.808
10,fc1,0.12180368,0.01000,0.807
10,fc2,0.00049581,0.01000,3.483
11,self_attn.k_proj,0.05712467,0.01000,0.802
11,self_attn.v_proj,0.01546244,0.01000,0.805
11,self_attn.q_proj,0.04620140,0.01000,0.799
11,self_attn.out_proj,0.00013356,0.01000,0.806
11,fc1,0.12510935,0.01000,0.807
11,fc2,0.00070838,0.01000,3.464
12,self_attn.k_proj,0.06126989,0.01000,0.794
12,self_attn.v_proj,0.01617533,0.01000,0.797
12,self_attn.q_proj,0.04634463,0.01000,0.800
12,self_attn.out_proj,0.00022420,0.01000,0.798
12,fc1,0.12253537,0.01000,0.815
12,fc2,0.00098394,0.01000,3.459
13,self_attn.k_proj,0.06390332,0.01000,0.808
13,self_attn.v_proj,0.01698245,0.01000,0.797
13,self_attn.q_proj,0.04609602,0.01000,0.802
13,self_attn.out_proj,0.00024484,0.01000,0.808
13,fc1,0.12942690,0.01000,0.801
13,fc2,0.00133922,0.01000,3.477
14,self_attn.k_proj,0.05804610,0.01000,0.815
14,self_attn.v_proj,0.02069202,0.01000,0.790
14,self_attn.q_proj,0.04335492,0.01000,0.794
14,self_attn.out_proj,0.00028324,0.01000,0.790
14,fc1,0.13748725,0.01000,0.824
14,fc2,0.00186989,0.01000,3.495
15,self_attn.k_proj,0.05209177,0.01000,0.802
15,self_attn.v_proj,0.02601032,0.01000,0.798
15,self_attn.q_proj,0.04298635,0.01000,0.793
15,self_attn.out_proj,0.00026579,0.01000,0.791
15,fc1,0.14352571,0.01000,0.799
15,fc2,0.00233943,0.01000,3.489
16,self_attn.k_proj,0.05171879,0.01000,0.791
16,self_attn.v_proj,0.02765215,0.01000,0.792
16,self_attn.q_proj,0.03754202,0.01000,0.825
16,self_attn.out_proj,0.00039184,0.01000,0.804
16,fc1,0.15427885,0.01000,0.823
16,fc2,0.00305063,0.01000,3.491
17,self_attn.k_proj,0.05001822,0.01000,0.794
17,self_attn.v_proj,0.02992602,0.01000,0.803
17,self_attn.q_proj,0.03717646,0.01000,0.832
17,self_attn.out_proj,0.00044749,0.01000,0.800
17,fc1,0.16721998,0.01000,0.803
17,fc2,0.00387488,0.01000,3.446
18,self_attn.k_proj,0.04496108,0.01000,0.804
18,self_attn.v_proj,0.03398469,0.01000,0.799
18,self_attn.q_proj,0.03570567,0.01000,0.800
18,self_attn.out_proj,0.00052166,0.01000,0.798
18,fc1,0.17648941,0.01000,0.796
18,fc2,0.00477775,0.01000,3.467
19,self_attn.k_proj,0.04617426,0.01000,0.778
19,self_attn.v_proj,0.04399054,0.01000,0.786
19,self_attn.q_proj,0.03593020,0.01000,0.793
19,self_attn.out_proj,0.00082788,0.01000,0.788
19,fc1,0.19112378,0.01000,0.797
19,fc2,0.00600311,0.01000,3.433
20,self_attn.k_proj,0.04817279,0.01000,0.812
20,self_attn.v_proj,0.05046446,0.01000,0.795
20,self_attn.q_proj,0.03522086,0.01000,0.796
20,self_attn.out_proj,0.00096899,0.01000,0.772
20,fc1,0.20045713,0.01000,0.786
20,fc2,0.00774820,0.01000,3.401
21,self_attn.k_proj,0.04507433,0.01000,0.818
21,self_attn.v_proj,0.05300805,0.01000,0.789
21,self_attn.q_proj,0.03941233,0.01000,0.782
21,self_attn.out_proj,0.00082373,0.01000,0.787
21,fc1,0.20499779,0.01000,0.789
21,fc2,0.00907014,0.01000,3.453
22,self_attn.k_proj,0.04758519,0.01000,0.795
22,self_attn.v_proj,0.06150986,0.01000,0.796
22,self_attn.q_proj,0.04965690,0.01000,0.795
22,self_attn.out_proj,0.00088354,0.01000,0.781
22,fc1,0.20536900,0.01000,0.840
22,fc2,0.00947218,0.01000,3.441
23,self_attn.k_proj,0.06900742,0.01000,0.810
23,self_attn.v_proj,0.04522258,0.01000,0.802
23,self_attn.q_proj,0.11501978,0.01000,0.806
23,self_attn.out_proj,0.00240127,0.01000,0.796
23,fc1,0.19866552,0.01000,0.803
23,fc2,0.00691203,0.01000,3.478
|