| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000074878,0.05000,5.659 | |
| 0,self_attn.q_proj,0.0000147233,0.05000,5.662 | |
| 0,self_attn.v_proj,0.0000004164,0.05000,5.716 | |
| 0,self_attn.o_proj,0.0000000188,0.05000,1.023 | |
| 0,mlp.up_proj,0.0000073224,0.05000,2.317 | |
| 0,mlp.gate_proj,0.0000083827,0.05000,2.350 | |
| 0,mlp.down_proj,0.0000001028,0.05000,2.886 | |
| 1,self_attn.k_proj,0.0000103207,0.05000,5.596 | |
| 1,self_attn.q_proj,0.0000175984,0.05000,5.661 | |
| 1,self_attn.v_proj,0.0000011597,0.05000,5.641 | |
| 1,self_attn.o_proj,0.0000000697,0.05000,1.044 | |
| 1,mlp.up_proj,0.0000099559,0.05000,2.788 | |
| 1,mlp.gate_proj,0.0000113476,0.05000,2.853 | |
| 1,mlp.down_proj,0.0000025962,0.05000,3.085 | |
| 2,self_attn.q_proj,0.0000739263,0.05000,5.511 | |
| 2,self_attn.k_proj,0.0000441155,0.05000,5.576 | |
| 2,self_attn.v_proj,0.0000044463,0.05000,5.601 | |
| 2,self_attn.o_proj,0.0000000672,0.05000,1.023 | |
| 2,mlp.gate_proj,0.0000187338,0.05000,2.298 | |
| 2,mlp.up_proj,0.0000158255,0.05000,2.314 | |
| 2,mlp.down_proj,0.0000003259,0.05000,3.034 | |
| 3,self_attn.k_proj,0.0000269141,0.05000,4.896 | |
| 3,self_attn.v_proj,0.0000044659,0.05000,4.894 | |
| 3,self_attn.q_proj,0.0000484370,0.05000,4.953 | |
| 3,self_attn.o_proj,0.0000001267,0.05000,1.037 | |
| 3,mlp.gate_proj,0.0000267179,0.05000,2.337 | |
| 3,mlp.up_proj,0.0000199634,0.05000,2.363 | |
| 3,mlp.down_proj,0.0000004599,0.05000,2.975 | |
| 4,self_attn.k_proj,0.0000258326,0.05000,4.882 | |
| 4,self_attn.v_proj,0.0000047591,0.05000,4.884 | |
| 4,self_attn.q_proj,0.0000493107,0.05000,4.944 | |
| 4,self_attn.o_proj,0.0000001978,0.05000,1.044 | |
| 4,mlp.gate_proj,0.0000357187,0.05000,2.398 | |
| 4,mlp.up_proj,0.0000239637,0.05000,2.397 | |
| 4,mlp.down_proj,0.0000006565,0.05000,2.979 | |
| 5,self_attn.k_proj,0.0000427736,0.05000,4.861 | |
| 5,self_attn.q_proj,0.0000706749,0.05000,4.928 | |
| 5,self_attn.v_proj,0.0000049181,0.05000,4.948 | |
| 5,self_attn.o_proj,0.0000002486,0.05000,1.045 | |
| 5,mlp.gate_proj,0.0000385495,0.05000,2.308 | |
| 5,mlp.up_proj,0.0000273058,0.05000,2.328 | |
| 5,mlp.down_proj,0.0000008979,0.05000,3.011 | |
| 6,self_attn.k_proj,0.0000308670,0.05000,4.806 | |
| 6,self_attn.q_proj,0.0000581398,0.05000,4.846 | |
| 6,self_attn.v_proj,0.0000045627,0.05000,4.885 | |
| 6,self_attn.o_proj,0.0000003760,0.05000,1.026 | |
| 6,mlp.up_proj,0.0000291855,0.05000,2.248 | |
| 6,mlp.gate_proj,0.0000411316,0.05000,2.276 | |
| 6,mlp.down_proj,0.0000010291,0.05000,3.053 | |
| 7,self_attn.v_proj,0.0000040204,0.05000,4.955 | |
| 7,self_attn.q_proj,0.0000492176,0.05000,5.028 | |
| 7,self_attn.k_proj,0.0000289958,0.05000,5.047 | |
| 7,self_attn.o_proj,0.0000005308,0.05000,1.029 | |
| 7,mlp.up_proj,0.0000311719,0.05000,2.240 | |
| 7,mlp.gate_proj,0.0000403425,0.05000,2.263 | |
| 7,mlp.down_proj,0.0000011793,0.05000,2.982 | |
| 8,self_attn.q_proj,0.0000629039,0.05000,4.885 | |
| 8,self_attn.v_proj,0.0000050514,0.05000,4.884 | |
| 8,self_attn.k_proj,0.0000379682,0.05000,4.907 | |
| 8,self_attn.o_proj,0.0000006740,0.05000,1.021 | |
| 8,mlp.gate_proj,0.0000429643,0.05000,2.269 | |
| 8,mlp.up_proj,0.0000325408,0.05000,2.289 | |
| 8,mlp.down_proj,0.0000012385,0.05000,2.952 | |
| 9,self_attn.k_proj,0.0000347599,0.05000,4.724 | |
| 9,self_attn.v_proj,0.0000061279,0.05000,4.800 | |
| 9,self_attn.q_proj,0.0000586902,0.05000,4.826 | |
| 9,self_attn.o_proj,0.0000007288,0.05000,1.020 | |
| 9,mlp.up_proj,0.0000325744,0.05000,2.317 | |
| 9,mlp.gate_proj,0.0000417335,0.05000,2.339 | |
| 9,mlp.down_proj,0.0000012440,0.05000,2.978 | |
| 10,self_attn.k_proj,0.0000367776,0.05000,4.779 | |
| 10,self_attn.v_proj,0.0000047437,0.05000,4.837 | |
| 10,self_attn.q_proj,0.0000589483,0.05000,4.863 | |
| 10,self_attn.o_proj,0.0000007045,0.05000,1.006 | |
| 10,mlp.up_proj,0.0000355694,0.05000,2.252 | |
| 10,mlp.gate_proj,0.0000426607,0.05000,2.269 | |
| 10,mlp.down_proj,0.0000014252,0.05000,2.945 | |
| 11,self_attn.v_proj,0.0000056424,0.05000,4.732 | |
| 11,self_attn.k_proj,0.0000276094,0.05000,4.769 | |
| 11,self_attn.q_proj,0.0000490194,0.05000,4.803 | |
| 11,self_attn.o_proj,0.0000008918,0.05000,1.040 | |
| 11,mlp.gate_proj,0.0000447233,0.05000,2.266 | |
| 11,mlp.up_proj,0.0000384965,0.05000,2.282 | |
| 11,mlp.down_proj,0.0000016130,0.05000,2.992 | |
| 12,self_attn.v_proj,0.0000062276,0.05000,4.821 | |
| 12,self_attn.q_proj,0.0000707292,0.05000,4.844 | |
| 12,self_attn.k_proj,0.0000422481,0.05000,4.875 | |
| 12,self_attn.o_proj,0.0000010586,0.05000,1.013 | |
| 12,mlp.up_proj,0.0000412534,0.05000,2.241 | |
| 12,mlp.gate_proj,0.0000475553,0.05000,2.264 | |
| 12,mlp.down_proj,0.0000018156,0.05000,2.954 | |
| 13,self_attn.q_proj,0.0000746849,0.05000,4.776 | |
| 13,self_attn.k_proj,0.0000481807,0.05000,4.811 | |
| 13,self_attn.v_proj,0.0000073153,0.05000,4.843 | |
| 13,self_attn.o_proj,0.0000012458,0.05000,1.019 | |
| 13,mlp.up_proj,0.0000458390,0.05000,2.347 | |
| 13,mlp.gate_proj,0.0000565005,0.05000,2.372 | |
| 13,mlp.down_proj,0.0000024355,0.05000,2.979 | |
| 14,self_attn.k_proj,0.0000378307,0.05000,4.768 | |
| 14,self_attn.q_proj,0.0000819438,0.05000,4.881 | |
| 14,self_attn.v_proj,0.0000085098,0.05000,4.895 | |
| 14,self_attn.o_proj,0.0000014740,0.05000,1.037 | |
| 14,mlp.up_proj,0.0000496886,0.05000,2.248 | |
| 14,mlp.gate_proj,0.0000617393,0.05000,2.267 | |
| 14,mlp.down_proj,0.0000029373,0.05000,2.928 | |
| 15,self_attn.v_proj,0.0000085283,0.05000,4.719 | |
| 15,self_attn.k_proj,0.0000434987,0.05000,4.767 | |
| 15,self_attn.q_proj,0.0000836970,0.05000,4.813 | |
| 15,self_attn.o_proj,0.0000009290,0.05000,1.022 | |
| 15,mlp.gate_proj,0.0000665099,0.05000,2.268 | |
| 15,mlp.up_proj,0.0000498216,0.05000,2.299 | |
| 15,mlp.down_proj,0.0000030499,0.05000,2.931 | |
| 16,self_attn.q_proj,0.0000871859,0.05000,4.742 | |
| 16,self_attn.k_proj,0.0000490420,0.05000,4.803 | |
| 16,self_attn.v_proj,0.0000096564,0.05000,4.838 | |
| 16,self_attn.o_proj,0.0000006811,0.05000,1.031 | |
| 16,mlp.gate_proj,0.0000679251,0.05000,2.348 | |
| 16,mlp.up_proj,0.0000497399,0.05000,2.371 | |
| 16,mlp.down_proj,0.0000029397,0.05000,2.928 | |
| 17,self_attn.q_proj,0.0000832187,0.05000,4.610 | |
| 17,self_attn.v_proj,0.0000093413,0.05000,4.761 | |
| 17,self_attn.k_proj,0.0000452292,0.05000,4.788 | |
| 17,self_attn.o_proj,0.0000006960,0.05000,1.055 | |
| 17,mlp.up_proj,0.0000515798,0.05000,2.270 | |
| 17,mlp.gate_proj,0.0000716405,0.05000,2.285 | |
| 17,mlp.down_proj,0.0000032355,0.05000,2.951 | |
| 18,self_attn.v_proj,0.0000116876,0.05000,4.763 | |
| 18,self_attn.k_proj,0.0000521751,0.05000,4.815 | |
| 18,self_attn.q_proj,0.0000943415,0.05000,4.836 | |
| 18,self_attn.o_proj,0.0000007594,0.05000,1.024 | |
| 18,mlp.gate_proj,0.0000745484,0.05000,2.296 | |
| 18,mlp.up_proj,0.0000550380,0.05000,2.313 | |
| 18,mlp.down_proj,0.0000034218,0.05000,2.943 | |
| 19,self_attn.q_proj,0.0000838091,0.05000,4.770 | |
| 19,self_attn.v_proj,0.0000114893,0.05000,4.822 | |
| 19,self_attn.k_proj,0.0000487867,0.05000,4.842 | |
| 19,self_attn.o_proj,0.0000009830,0.05000,1.065 | |
| 19,mlp.gate_proj,0.0000804051,0.05000,2.317 | |
| 19,mlp.up_proj,0.0000600660,0.05000,2.329 | |
| 19,mlp.down_proj,0.0000042528,0.05000,2.947 | |
| 20,self_attn.q_proj,0.0000873402,0.05000,4.741 | |
| 20,self_attn.v_proj,0.0000137784,0.05000,4.810 | |
| 20,self_attn.k_proj,0.0000528894,0.05000,4.846 | |
| 20,self_attn.o_proj,0.0000007206,0.05000,1.018 | |
| 20,mlp.gate_proj,0.0000781699,0.05000,2.336 | |
| 20,mlp.up_proj,0.0000613666,0.05000,2.355 | |
| 20,mlp.down_proj,0.0000041109,0.05000,2.994 | |
| 21,self_attn.q_proj,0.0000868639,0.05000,4.764 | |
| 21,self_attn.k_proj,0.0000519479,0.05000,4.812 | |
| 21,self_attn.v_proj,0.0000178721,0.05000,4.847 | |
| 21,self_attn.o_proj,0.0000008751,0.05000,1.000 | |
| 21,mlp.up_proj,0.0000650703,0.05000,2.354 | |
| 21,mlp.gate_proj,0.0000835892,0.05000,2.381 | |
| 21,mlp.down_proj,0.0000043956,0.05000,2.923 | |
| 22,self_attn.v_proj,0.0000177718,0.05000,4.708 | |
| 22,self_attn.k_proj,0.0000496925,0.05000,4.778 | |
| 22,self_attn.q_proj,0.0000848907,0.05000,4.811 | |
| 22,self_attn.o_proj,0.0000007073,0.05000,1.012 | |
| 22,mlp.up_proj,0.0000702587,0.05000,2.325 | |
| 22,mlp.gate_proj,0.0000909208,0.05000,2.340 | |
| 22,mlp.down_proj,0.0000049920,0.05000,2.933 | |
| 23,self_attn.v_proj,0.0000174651,0.05000,4.746 | |
| 23,self_attn.q_proj,0.0000855378,0.05000,4.796 | |
| 23,self_attn.k_proj,0.0000534188,0.05000,4.820 | |
| 23,self_attn.o_proj,0.0000011784,0.05000,1.016 | |
| 23,mlp.gate_proj,0.0001065173,0.05000,2.276 | |
| 23,mlp.up_proj,0.0000778496,0.05000,2.298 | |
| 23,mlp.down_proj,0.0000061454,0.05000,2.960 | |
| 24,self_attn.v_proj,0.0000258239,0.05000,4.777 | |
| 24,self_attn.k_proj,0.0000595539,0.05000,4.808 | |
| 24,self_attn.q_proj,0.0000942610,0.05000,4.838 | |
| 24,self_attn.o_proj,0.0000017130,0.05000,1.006 | |
| 24,mlp.up_proj,0.0000840494,0.05000,2.249 | |
| 24,mlp.gate_proj,0.0001173177,0.05000,2.264 | |
| 24,mlp.down_proj,0.0000069910,0.05000,2.990 | |
| 25,self_attn.q_proj,0.0000879538,0.05000,4.745 | |
| 25,self_attn.k_proj,0.0000456781,0.05000,4.820 | |
| 25,self_attn.v_proj,0.0000218952,0.05000,4.851 | |
| 25,self_attn.o_proj,0.0000017481,0.05000,1.007 | |
| 25,mlp.gate_proj,0.0001278075,0.05000,2.386 | |
| 25,mlp.up_proj,0.0000906748,0.05000,2.420 | |
| 25,mlp.down_proj,0.0000087553,0.05000,2.930 | |
| 26,self_attn.v_proj,0.0000302323,0.05000,4.811 | |
| 26,self_attn.q_proj,0.0000829504,0.05000,4.829 | |
| 26,self_attn.k_proj,0.0000538115,0.05000,4.855 | |
| 26,self_attn.o_proj,0.0000024757,0.05000,1.023 | |
| 26,mlp.up_proj,0.0000947583,0.05000,2.376 | |
| 26,mlp.gate_proj,0.0001355632,0.05000,2.382 | |
| 26,mlp.down_proj,0.0000126745,0.05000,3.007 | |
| 27,self_attn.k_proj,0.0000373252,0.05000,4.704 | |
| 27,self_attn.v_proj,0.0000200833,0.05000,4.782 | |
| 27,self_attn.q_proj,0.0000657733,0.05000,4.821 | |
| 27,self_attn.o_proj,0.0000077384,0.05000,1.004 | |
| 27,mlp.up_proj,0.0001052698,0.05000,2.324 | |
| 27,mlp.gate_proj,0.0001328537,0.05000,2.335 | |
| 27,mlp.down_proj,0.0000376315,0.05000,2.955 | |