| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000002985,0.01000,4.947 | |
| 0,self_attn.v_proj,0.0000000628,0.01000,1.884 | |
| 0,self_attn.q_proj,0.0000008087,0.01000,1.865 | |
| 0,self_attn.o_proj,0.0000009411,0.01000,1.889 | |
| 0,mlp.up_proj,0.0000003857,0.01000,1.936 | |
| 0,mlp.gate_proj,0.0000004343,0.01000,1.944 | |
| 0,mlp.down_proj,0.0000008139,0.01000,6.115 | |
| 1,self_attn.k_proj,0.0000000138,0.01000,1.904 | |
| 1,self_attn.v_proj,0.0000000049,0.01000,1.858 | |
| 1,self_attn.q_proj,0.0000000554,0.01000,1.897 | |
| 1,self_attn.o_proj,0.0000000136,0.01000,1.902 | |
| 1,mlp.up_proj,0.0000018059,0.01000,1.992 | |
| 1,mlp.gate_proj,0.0000048088,0.01000,1.986 | |
| 1,mlp.down_proj,0.0000000962,0.01000,6.180 | |
| 2,self_attn.k_proj,0.0000000607,0.01000,1.859 | |
| 2,self_attn.v_proj,0.0000000150,0.01000,1.884 | |
| 2,self_attn.q_proj,0.0000001718,0.01000,1.890 | |
| 2,self_attn.o_proj,0.0000000996,0.01000,1.952 | |
| 2,mlp.up_proj,0.0000043320,0.01000,2.028 | |
| 2,mlp.gate_proj,0.0000081417,0.01000,1.956 | |
| 2,mlp.down_proj,0.0000004419,0.01000,6.144 | |
| 3,self_attn.k_proj,0.0000003379,0.01000,1.877 | |
| 3,self_attn.v_proj,0.0000000693,0.01000,1.870 | |
| 3,self_attn.q_proj,0.0000009042,0.01000,1.892 | |
| 3,self_attn.o_proj,0.0000002491,0.01000,1.931 | |
| 3,mlp.up_proj,0.0000050404,0.01000,1.994 | |
| 3,mlp.gate_proj,0.0000106641,0.01000,1.996 | |
| 3,mlp.down_proj,0.0000007892,0.01000,6.105 | |
| 4,self_attn.k_proj,0.0000003962,0.01000,1.884 | |
| 4,self_attn.v_proj,0.0000001156,0.01000,1.823 | |
| 4,self_attn.q_proj,0.0000010681,0.01000,1.846 | |
| 4,self_attn.o_proj,0.0000004779,0.01000,1.910 | |
| 4,mlp.up_proj,0.0000107675,0.01000,2.053 | |
| 4,mlp.gate_proj,0.0000199058,0.01000,2.028 | |
| 4,mlp.down_proj,0.0013483506,0.01000,6.148 | |
| 5,self_attn.k_proj,0.0000013836,0.01000,1.869 | |
| 5,self_attn.v_proj,0.0000005688,0.01000,1.827 | |
| 5,self_attn.q_proj,0.0000044049,0.01000,1.926 | |
| 5,self_attn.o_proj,0.0000007381,0.01000,1.906 | |
| 5,mlp.up_proj,0.0000180994,0.01000,1.995 | |
| 5,mlp.gate_proj,0.0000349824,0.01000,1.990 | |
| 5,mlp.down_proj,0.0000037041,0.01000,6.229 | |
| 6,self_attn.k_proj,0.0000015295,0.01000,1.891 | |
| 6,self_attn.v_proj,0.0000008116,0.01000,1.841 | |
| 6,self_attn.q_proj,0.0000052489,0.01000,1.904 | |
| 6,self_attn.o_proj,0.0000006595,0.01000,1.914 | |
| 6,mlp.up_proj,0.0000294027,0.01000,2.036 | |
| 6,mlp.gate_proj,0.0000543190,0.01000,2.000 | |
| 6,mlp.down_proj,0.0000033944,0.01000,6.185 | |
| 7,self_attn.k_proj,0.0000022324,0.01000,1.848 | |
| 7,self_attn.v_proj,0.0000012807,0.01000,1.836 | |
| 7,self_attn.q_proj,0.0000077740,0.01000,1.898 | |
| 7,self_attn.o_proj,0.0000006588,0.01000,1.889 | |
| 7,mlp.up_proj,0.0000377604,0.01000,2.007 | |
| 7,mlp.gate_proj,0.0000714821,0.01000,2.013 | |
| 7,mlp.down_proj,0.0000025652,0.01000,6.107 | |
| 8,self_attn.k_proj,0.0000024254,0.01000,1.863 | |
| 8,self_attn.v_proj,0.0000010471,0.01000,1.841 | |
| 8,self_attn.q_proj,0.0000081145,0.01000,1.936 | |
| 8,self_attn.o_proj,0.0000005655,0.01000,1.886 | |
| 8,mlp.up_proj,0.0000263257,0.01000,2.090 | |
| 8,mlp.gate_proj,0.0000475203,0.01000,2.009 | |
| 8,mlp.down_proj,0.0000034082,0.01000,6.117 | |
| 9,self_attn.k_proj,0.0000022917,0.01000,1.865 | |
| 9,self_attn.v_proj,0.0000013029,0.01000,1.832 | |
| 9,self_attn.q_proj,0.0000077636,0.01000,1.919 | |
| 9,self_attn.o_proj,0.0000010365,0.01000,1.908 | |
| 9,mlp.up_proj,0.0000193074,0.01000,1.997 | |
| 9,mlp.gate_proj,0.0000211020,0.01000,2.014 | |
| 9,mlp.down_proj,0.0000048219,0.01000,6.151 | |
| 10,self_attn.k_proj,0.0000034324,0.01000,1.867 | |
| 10,self_attn.v_proj,0.0000019137,0.01000,1.831 | |
| 10,self_attn.q_proj,0.0000121056,0.01000,1.897 | |
| 10,self_attn.o_proj,0.0000010023,0.01000,1.873 | |
| 10,mlp.up_proj,0.0000224903,0.01000,2.013 | |
| 10,mlp.gate_proj,0.0000246599,0.01000,2.011 | |
| 10,mlp.down_proj,0.0000059849,0.01000,6.103 | |
| 11,self_attn.k_proj,0.0000025495,0.01000,1.908 | |
| 11,self_attn.v_proj,0.0000012462,0.01000,1.865 | |
| 11,self_attn.q_proj,0.0000090048,0.01000,1.923 | |
| 11,self_attn.o_proj,0.0000014718,0.01000,1.924 | |
| 11,mlp.up_proj,0.0000258469,0.01000,2.027 | |
| 11,mlp.gate_proj,0.0000321958,0.01000,1.986 | |
| 11,mlp.down_proj,0.0000051555,0.01000,6.087 | |
| 12,self_attn.k_proj,0.0000031215,0.01000,1.847 | |
| 12,self_attn.v_proj,0.0000014327,0.01000,1.841 | |
| 12,self_attn.q_proj,0.0000111406,0.01000,1.893 | |
| 12,self_attn.o_proj,0.0000017573,0.01000,1.957 | |
| 12,mlp.up_proj,0.0000284193,0.01000,2.017 | |
| 12,mlp.gate_proj,0.0000301645,0.01000,1.993 | |
| 12,mlp.down_proj,0.0000064959,0.01000,6.090 | |
| 13,self_attn.k_proj,0.0000034285,0.01000,1.923 | |
| 13,self_attn.v_proj,0.0000017783,0.01000,1.831 | |
| 13,self_attn.q_proj,0.0000119425,0.01000,1.911 | |
| 13,self_attn.o_proj,0.0000020312,0.01000,1.861 | |
| 13,mlp.up_proj,0.0000325586,0.01000,2.011 | |
| 13,mlp.gate_proj,0.0000345637,0.01000,1.978 | |
| 13,mlp.down_proj,0.0000076320,0.01000,6.090 | |
| 14,self_attn.k_proj,0.0000042219,0.01000,1.872 | |
| 14,self_attn.v_proj,0.0000019629,0.01000,1.827 | |
| 14,self_attn.q_proj,0.0000144176,0.01000,1.895 | |
| 14,self_attn.o_proj,0.0000020731,0.01000,1.931 | |
| 14,mlp.up_proj,0.0000335783,0.01000,2.019 | |
| 14,mlp.gate_proj,0.0000354549,0.01000,2.017 | |
| 14,mlp.down_proj,0.0000079941,0.01000,6.158 | |
| 15,self_attn.k_proj,0.0000036243,0.01000,1.894 | |
| 15,self_attn.v_proj,0.0000022559,0.01000,1.827 | |
| 15,self_attn.q_proj,0.0000129040,0.01000,1.897 | |
| 15,self_attn.o_proj,0.0000027518,0.01000,1.912 | |
| 15,mlp.up_proj,0.0000350510,0.01000,2.121 | |
| 15,mlp.gate_proj,0.0000385737,0.01000,1.996 | |
| 15,mlp.down_proj,0.0000085556,0.01000,6.094 | |
| 16,self_attn.k_proj,0.0000036654,0.01000,1.849 | |
| 16,self_attn.v_proj,0.0000015336,0.01000,1.822 | |
| 16,self_attn.q_proj,0.0000115880,0.01000,1.872 | |
| 16,self_attn.o_proj,0.0000024392,0.01000,1.921 | |
| 16,mlp.up_proj,0.0000326376,0.01000,2.085 | |
| 16,mlp.gate_proj,0.0000331992,0.01000,2.003 | |
| 16,mlp.down_proj,0.0000084625,0.01000,6.173 | |
| 17,self_attn.k_proj,0.0000040579,0.01000,1.885 | |
| 17,self_attn.v_proj,0.0000018465,0.01000,1.861 | |
| 17,self_attn.q_proj,0.0000138158,0.01000,1.906 | |
| 17,self_attn.o_proj,0.0000025808,0.01000,1.932 | |
| 17,mlp.up_proj,0.0000322729,0.01000,2.001 | |
| 17,mlp.gate_proj,0.0000317870,0.01000,1.997 | |
| 17,mlp.down_proj,0.0000080485,0.01000,6.129 | |
| 18,self_attn.k_proj,0.0000039598,0.01000,1.839 | |
| 18,self_attn.v_proj,0.0000020382,0.01000,1.798 | |
| 18,self_attn.q_proj,0.0000137095,0.01000,1.895 | |
| 18,self_attn.o_proj,0.0000029167,0.01000,1.892 | |
| 18,mlp.up_proj,0.0000323423,0.01000,1.998 | |
| 18,mlp.gate_proj,0.0000308571,0.01000,2.011 | |
| 18,mlp.down_proj,0.0000081186,0.01000,6.181 | |
| 19,self_attn.k_proj,0.0000043350,0.01000,1.867 | |
| 19,self_attn.v_proj,0.0000020963,0.01000,1.811 | |
| 19,self_attn.q_proj,0.0000163849,0.01000,1.886 | |
| 19,self_attn.o_proj,0.0000022194,0.01000,1.976 | |
| 19,mlp.up_proj,0.0000333286,0.01000,2.074 | |
| 19,mlp.gate_proj,0.0000317924,0.01000,2.042 | |
| 19,mlp.down_proj,0.0000083289,0.01000,6.124 | |
| 20,self_attn.k_proj,0.0000045548,0.01000,1.827 | |
| 20,self_attn.v_proj,0.0000019402,0.01000,1.863 | |
| 20,self_attn.q_proj,0.0000157211,0.01000,1.926 | |
| 20,self_attn.o_proj,0.0000029912,0.01000,1.890 | |
| 20,mlp.up_proj,0.0000323250,0.01000,2.020 | |
| 20,mlp.gate_proj,0.0000292523,0.01000,1.999 | |
| 20,mlp.down_proj,0.0000087532,0.01000,6.119 | |
| 21,self_attn.k_proj,0.0000042023,0.01000,1.894 | |
| 21,self_attn.v_proj,0.0000019321,0.01000,1.853 | |
| 21,self_attn.q_proj,0.0000144628,0.01000,1.918 | |
| 21,self_attn.o_proj,0.0000030416,0.01000,1.891 | |
| 21,mlp.up_proj,0.0000326811,0.01000,1.994 | |
| 21,mlp.gate_proj,0.0000293238,0.01000,1.979 | |
| 21,mlp.down_proj,0.0000085412,0.01000,6.151 | |
| 22,self_attn.k_proj,0.0000046789,0.01000,1.887 | |
| 22,self_attn.v_proj,0.0000028668,0.01000,1.833 | |
| 22,self_attn.q_proj,0.0000161835,0.01000,1.896 | |
| 22,self_attn.o_proj,0.0000038789,0.01000,1.901 | |
| 22,mlp.up_proj,0.0000331632,0.01000,2.071 | |
| 22,mlp.gate_proj,0.0000295798,0.01000,1.978 | |
| 22,mlp.down_proj,0.0000096156,0.01000,6.178 | |
| 23,self_attn.k_proj,0.0000043162,0.01000,1.860 | |
| 23,self_attn.v_proj,0.0000028849,0.01000,1.833 | |
| 23,self_attn.q_proj,0.0000160021,0.01000,1.861 | |
| 23,self_attn.o_proj,0.0000037945,0.01000,1.923 | |
| 23,mlp.up_proj,0.0000337720,0.01000,2.003 | |
| 23,mlp.gate_proj,0.0000317463,0.01000,2.011 | |
| 23,mlp.down_proj,0.0000093671,0.01000,6.194 | |
| 24,self_attn.k_proj,0.0000057187,0.01000,1.942 | |
| 24,self_attn.v_proj,0.0000024407,0.01000,1.866 | |
| 24,self_attn.q_proj,0.0000181873,0.01000,1.904 | |
| 24,self_attn.o_proj,0.0000041032,0.01000,1.924 | |
| 24,mlp.up_proj,0.0000324691,0.01000,2.000 | |
| 24,mlp.gate_proj,0.0000301167,0.01000,1.985 | |
| 24,mlp.down_proj,0.0000084492,0.01000,6.136 | |
| 25,self_attn.k_proj,0.0000055621,0.01000,1.846 | |
| 25,self_attn.v_proj,0.0000031424,0.01000,1.823 | |
| 25,self_attn.q_proj,0.0000198023,0.01000,1.922 | |
| 25,self_attn.o_proj,0.0000028802,0.01000,1.885 | |
| 25,mlp.up_proj,0.0000330885,0.01000,2.068 | |
| 25,mlp.gate_proj,0.0000296588,0.01000,2.031 | |
| 25,mlp.down_proj,0.0000089875,0.01000,6.062 | |
| 26,self_attn.k_proj,0.0000050286,0.01000,1.858 | |
| 26,self_attn.v_proj,0.0000021552,0.01000,1.866 | |
| 26,self_attn.q_proj,0.0000176642,0.01000,1.899 | |
| 26,self_attn.o_proj,0.0000031027,0.01000,1.904 | |
| 26,mlp.up_proj,0.0000356900,0.01000,2.014 | |
| 26,mlp.gate_proj,0.0000308428,0.01000,1.988 | |
| 26,mlp.down_proj,0.0000103464,0.01000,6.112 | |
| 27,self_attn.k_proj,0.0000050559,0.01000,1.826 | |
| 27,self_attn.v_proj,0.0000026083,0.01000,1.817 | |
| 27,self_attn.q_proj,0.0000170910,0.01000,1.898 | |
| 27,self_attn.o_proj,0.0000044997,0.01000,1.891 | |
| 27,mlp.up_proj,0.0000373241,0.01000,2.002 | |
| 27,mlp.gate_proj,0.0000323265,0.01000,2.026 | |
| 27,mlp.down_proj,0.0000123207,0.01000,6.172 | |
| 28,self_attn.k_proj,0.0000042150,0.01000,1.883 | |
| 28,self_attn.v_proj,0.0000037593,0.01000,1.861 | |
| 28,self_attn.q_proj,0.0000171301,0.01000,1.885 | |
| 28,self_attn.o_proj,0.0000054424,0.01000,1.916 | |
| 28,mlp.up_proj,0.0000382802,0.01000,1.990 | |
| 28,mlp.gate_proj,0.0000329041,0.01000,2.059 | |
| 28,mlp.down_proj,0.0000136056,0.01000,6.099 | |
| 29,self_attn.k_proj,0.0000055420,0.01000,1.847 | |
| 29,self_attn.v_proj,0.0000036558,0.01000,1.942 | |
| 29,self_attn.q_proj,0.0000196112,0.01000,1.991 | |
| 29,self_attn.o_proj,0.0000046135,0.01000,1.879 | |
| 29,mlp.up_proj,0.0000391342,0.01000,2.033 | |
| 29,mlp.gate_proj,0.0000337284,0.01000,1.968 | |
| 29,mlp.down_proj,0.0000148448,0.01000,6.136 | |
| 30,self_attn.k_proj,0.0000047346,0.01000,1.847 | |
| 30,self_attn.v_proj,0.0000041514,0.01000,1.863 | |
| 30,self_attn.q_proj,0.0000184229,0.01000,1.959 | |
| 30,self_attn.o_proj,0.0000064813,0.01000,1.855 | |
| 30,mlp.up_proj,0.0000411291,0.01000,2.034 | |
| 30,mlp.gate_proj,0.0000354981,0.01000,2.003 | |
| 30,mlp.down_proj,0.0000166990,0.01000,6.158 | |
| 31,self_attn.k_proj,0.0000048687,0.01000,1.867 | |
| 31,self_attn.v_proj,0.0000040193,0.01000,1.842 | |
| 31,self_attn.q_proj,0.0000189473,0.01000,1.897 | |
| 31,self_attn.o_proj,0.0000054662,0.01000,1.928 | |
| 31,mlp.up_proj,0.0000457638,0.01000,2.001 | |
| 31,mlp.gate_proj,0.0000403368,0.01000,2.053 | |
| 31,mlp.down_proj,0.0000203712,0.01000,6.115 | |
| 32,self_attn.k_proj,0.0000053250,0.01000,1.836 | |
| 32,self_attn.v_proj,0.0000053774,0.01000,1.829 | |
| 32,self_attn.q_proj,0.0000208265,0.01000,1.948 | |
| 32,self_attn.o_proj,0.0000054974,0.01000,1.923 | |
| 32,mlp.up_proj,0.0000489943,0.01000,2.010 | |
| 32,mlp.gate_proj,0.0000443471,0.01000,2.022 | |
| 32,mlp.down_proj,0.0000236334,0.01000,6.119 | |
| 33,self_attn.k_proj,0.0000055528,0.01000,1.860 | |
| 33,self_attn.v_proj,0.0000053279,0.01000,1.855 | |
| 33,self_attn.q_proj,0.0000225135,0.01000,1.882 | |
| 33,self_attn.o_proj,0.0000065416,0.01000,1.911 | |
| 33,mlp.up_proj,0.0000581524,0.01000,1.989 | |
| 33,mlp.gate_proj,0.0000532374,0.01000,1.992 | |
| 33,mlp.down_proj,0.0000341816,0.01000,6.194 | |
| 34,self_attn.k_proj,0.0000057969,0.01000,1.865 | |
| 34,self_attn.v_proj,0.0000065100,0.01000,1.820 | |
| 34,self_attn.q_proj,0.0000247060,0.01000,1.933 | |
| 34,self_attn.o_proj,0.0000064140,0.01000,1.974 | |
| 34,mlp.up_proj,0.0000676059,0.01000,1.996 | |
| 34,mlp.gate_proj,0.0000639034,0.01000,1.969 | |
| 34,mlp.down_proj,0.0000421207,0.01000,6.114 | |
| 35,self_attn.k_proj,0.0000056806,0.01000,1.843 | |
| 35,self_attn.v_proj,0.0000058037,0.01000,1.859 | |
| 35,self_attn.q_proj,0.0000227509,0.01000,1.864 | |
| 35,self_attn.o_proj,0.0000107215,0.01000,1.953 | |
| 35,mlp.up_proj,0.0000773738,0.01000,2.075 | |
| 35,mlp.gate_proj,0.0000748045,0.01000,2.003 | |
| 35,mlp.down_proj,0.0000531376,0.01000,6.151 | |
| 36,self_attn.k_proj,0.0000064778,0.01000,1.826 | |
| 36,self_attn.v_proj,0.0000105387,0.01000,1.820 | |
| 36,self_attn.q_proj,0.0000284083,0.01000,1.898 | |
| 36,self_attn.o_proj,0.0000097221,0.01000,1.959 | |
| 36,mlp.up_proj,0.0000858965,0.01000,2.012 | |
| 36,mlp.gate_proj,0.0000823549,0.01000,2.042 | |
| 36,mlp.down_proj,0.0000657707,0.01000,6.164 | |
| 37,self_attn.k_proj,0.0000074679,0.01000,1.836 | |
| 37,self_attn.v_proj,0.0000103437,0.01000,1.870 | |
| 37,self_attn.q_proj,0.0000301686,0.01000,1.843 | |
| 37,self_attn.o_proj,0.0000103363,0.01000,1.949 | |
| 37,mlp.up_proj,0.0000963696,0.01000,2.029 | |
| 37,mlp.gate_proj,0.0000927627,0.01000,1.995 | |
| 37,mlp.down_proj,0.0000759659,0.01000,6.172 | |
| 38,self_attn.k_proj,0.0000072543,0.01000,1.906 | |
| 38,self_attn.v_proj,0.0000103870,0.01000,1.833 | |
| 38,self_attn.q_proj,0.0000302236,0.01000,1.885 | |
| 38,self_attn.o_proj,0.0000106793,0.01000,1.909 | |
| 38,mlp.up_proj,0.0001080096,0.01000,1.994 | |
| 38,mlp.gate_proj,0.0001029393,0.01000,2.037 | |
| 38,mlp.down_proj,0.0000864311,0.01000,6.118 | |
| 39,self_attn.k_proj,0.0000070753,0.01000,1.848 | |
| 39,self_attn.v_proj,0.0000115101,0.01000,1.855 | |
| 39,self_attn.q_proj,0.0000317167,0.01000,1.926 | |
| 39,self_attn.o_proj,0.0000149693,0.01000,1.908 | |
| 39,mlp.up_proj,0.0001216658,0.01000,2.038 | |
| 39,mlp.gate_proj,0.0001149202,0.01000,2.005 | |
| 39,mlp.down_proj,0.0001039416,0.01000,6.191 | |
| 40,self_attn.k_proj,0.0000081462,0.01000,1.824 | |
| 40,self_attn.v_proj,0.0000157852,0.01000,1.910 | |
| 40,self_attn.q_proj,0.0000353841,0.01000,1.991 | |
| 40,self_attn.o_proj,0.0000151671,0.01000,1.913 | |
| 40,mlp.up_proj,0.0001326770,0.01000,2.002 | |
| 40,mlp.gate_proj,0.0001247391,0.01000,2.012 | |
| 40,mlp.down_proj,0.0001193831,0.01000,6.104 | |
| 41,self_attn.k_proj,0.0000079063,0.01000,1.881 | |
| 41,self_attn.v_proj,0.0000165749,0.01000,1.930 | |
| 41,self_attn.q_proj,0.0000366510,0.01000,1.896 | |
| 41,self_attn.o_proj,0.0000124038,0.01000,1.877 | |
| 41,mlp.up_proj,0.0001447803,0.01000,1.999 | |
| 41,mlp.gate_proj,0.0001340893,0.01000,1.963 | |
| 41,mlp.down_proj,0.0001349494,0.01000,6.061 | |
| 42,self_attn.k_proj,0.0000083146,0.01000,1.833 | |
| 42,self_attn.v_proj,0.0000181338,0.01000,1.793 | |
| 42,self_attn.q_proj,0.0000357798,0.01000,1.855 | |
| 42,self_attn.o_proj,0.0000141514,0.01000,1.914 | |
| 42,mlp.up_proj,0.0001559160,0.01000,1.990 | |
| 42,mlp.gate_proj,0.0001425551,0.01000,1.997 | |
| 42,mlp.down_proj,0.0001580665,0.01000,6.099 | |
| 43,self_attn.k_proj,0.0000083956,0.01000,1.822 | |
| 43,self_attn.v_proj,0.0000256210,0.01000,1.813 | |
| 43,self_attn.q_proj,0.0000399949,0.01000,1.861 | |
| 43,self_attn.o_proj,0.0000247247,0.01000,1.883 | |
| 43,mlp.up_proj,0.0001706939,0.01000,2.020 | |
| 43,mlp.gate_proj,0.0001531956,0.01000,2.037 | |
| 43,mlp.down_proj,0.0001867778,0.01000,6.179 | |
| 44,self_attn.k_proj,0.0000076330,0.01000,1.852 | |
| 44,self_attn.v_proj,0.0000281914,0.01000,1.820 | |
| 44,self_attn.q_proj,0.0000391793,0.01000,1.889 | |
| 44,self_attn.o_proj,0.0000360502,0.01000,1.884 | |
| 44,mlp.up_proj,0.0001831046,0.01000,1.963 | |
| 44,mlp.gate_proj,0.0001616602,0.01000,1.966 | |
| 44,mlp.down_proj,0.0002535868,0.01000,6.108 | |
| 45,self_attn.k_proj,0.0000079784,0.01000,1.892 | |
| 45,self_attn.v_proj,0.0000340295,0.01000,1.838 | |
| 45,self_attn.q_proj,0.0000422606,0.01000,1.895 | |
| 45,self_attn.o_proj,0.0000337677,0.01000,1.944 | |
| 45,mlp.up_proj,0.0001918452,0.01000,1.990 | |
| 45,mlp.gate_proj,0.0001717587,0.01000,1.985 | |
| 45,mlp.down_proj,0.0002833572,0.01000,6.189 | |
| 46,self_attn.k_proj,0.0000071048,0.01000,1.838 | |
| 46,self_attn.v_proj,0.0000363993,0.01000,1.838 | |
| 46,self_attn.q_proj,0.0000375253,0.01000,1.876 | |
| 46,self_attn.o_proj,0.0000640068,0.01000,1.919 | |
| 46,mlp.up_proj,0.0001911036,0.01000,2.009 | |
| 46,mlp.gate_proj,0.0001784168,0.01000,2.081 | |
| 46,mlp.down_proj,0.0004206370,0.01000,6.225 | |
| 47,self_attn.k_proj,0.0000061165,0.01000,1.837 | |
| 47,self_attn.v_proj,0.0000228788,0.01000,1.920 | |
| 47,self_attn.q_proj,0.0000279219,0.01000,1.940 | |
| 47,self_attn.o_proj,0.0000288922,0.01000,1.906 | |
| 47,mlp.up_proj,0.0002043838,0.01000,2.035 | |
| 47,mlp.gate_proj,0.0001966780,0.01000,2.033 | |
| 47,mlp.down_proj,0.0006320129,0.01000,6.199 | |