| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000140,0.05000,4.228 | |
| 0,self_attn.v_proj,0.0000000124,0.05000,4.254 | |
| 0,self_attn.q_proj,0.0000000516,0.05000,4.261 | |
| 0,self_attn.o_proj,0.0000004712,0.05000,1.340 | |
| 0,mlp.gate_proj,0.0000012445,0.05000,2.618 | |
| 0,mlp.up_proj,0.0000012150,0.05000,2.659 | |
| 0,mlp.down_proj,0.0000016537,0.05000,10.010 | |
| 1,self_attn.q_proj,0.0000000072,0.05000,4.470 | |
| 1,self_attn.v_proj,0.0000000037,0.05000,4.508 | |
| 1,self_attn.k_proj,0.0000000025,0.05000,4.615 | |
| 1,self_attn.o_proj,0.0000000651,0.05000,1.287 | |
| 1,mlp.up_proj,0.0000018015,0.05000,2.635 | |
| 1,mlp.gate_proj,0.0000018618,0.05000,2.643 | |
| 1,mlp.down_proj,0.0000002155,0.05000,10.157 | |
| 2,self_attn.q_proj,0.0000000276,0.05000,3.988 | |
| 2,self_attn.v_proj,0.0000000083,0.05000,4.042 | |
| 2,self_attn.k_proj,0.0000000079,0.05000,4.085 | |
| 2,self_attn.o_proj,0.0000002534,0.05000,1.433 | |
| 2,mlp.gate_proj,0.0000038101,0.05000,3.364 | |
| 2,mlp.up_proj,0.0000034955,0.05000,3.382 | |
| 2,mlp.down_proj,0.0001161570,0.05000,10.704 | |
| 3,self_attn.v_proj,0.0000000232,0.05000,3.838 | |
| 3,self_attn.q_proj,0.0000000686,0.05000,3.841 | |
| 3,self_attn.k_proj,0.0000000196,0.05000,3.857 | |
| 3,self_attn.o_proj,0.0000004138,0.05000,1.340 | |
| 3,mlp.gate_proj,0.0000050197,0.05000,2.753 | |
| 3,mlp.up_proj,0.0000049241,0.05000,2.766 | |
| 3,mlp.down_proj,0.0000009193,0.05000,10.108 | |
| 4,self_attn.v_proj,0.0000000410,0.05000,3.939 | |
| 4,self_attn.q_proj,0.0000001232,0.05000,3.984 | |
| 4,self_attn.k_proj,0.0000000351,0.05000,3.988 | |
| 4,self_attn.o_proj,0.0000003411,0.05000,1.325 | |
| 4,mlp.gate_proj,0.0000069457,0.05000,2.593 | |
| 4,mlp.up_proj,0.0000066921,0.05000,2.608 | |
| 4,mlp.down_proj,0.0000014823,0.05000,10.176 | |
| 5,self_attn.q_proj,0.0000001865,0.05000,4.672 | |
| 5,self_attn.k_proj,0.0000000512,0.05000,4.691 | |
| 5,self_attn.v_proj,0.0000000594,0.05000,4.783 | |
| 5,self_attn.o_proj,0.0000005891,0.05000,1.296 | |
| 5,mlp.up_proj,0.0000082574,0.05000,2.916 | |
| 5,mlp.gate_proj,0.0000085516,0.05000,2.932 | |
| 5,mlp.down_proj,0.0000019622,0.05000,10.073 | |
| 6,self_attn.q_proj,0.0000003242,0.05000,4.042 | |
| 6,self_attn.k_proj,0.0000000875,0.05000,4.053 | |
| 6,self_attn.v_proj,0.0000001055,0.05000,4.072 | |
| 6,self_attn.o_proj,0.0000007174,0.05000,1.328 | |
| 6,mlp.up_proj,0.0000101675,0.05000,2.792 | |
| 6,mlp.gate_proj,0.0000105692,0.05000,2.805 | |
| 6,mlp.down_proj,0.0000026730,0.05000,10.023 | |
| 7,self_attn.v_proj,0.0000001784,0.05000,4.072 | |
| 7,self_attn.q_proj,0.0000006267,0.05000,4.119 | |
| 7,self_attn.k_proj,0.0000001707,0.05000,4.130 | |
| 7,self_attn.o_proj,0.0000010049,0.05000,1.333 | |
| 7,mlp.up_proj,0.0000117455,0.05000,2.662 | |
| 7,mlp.gate_proj,0.0000123962,0.05000,2.662 | |
| 7,mlp.down_proj,0.0000032665,0.05000,10.283 | |
| 8,self_attn.k_proj,0.0000001502,0.05000,3.955 | |
| 8,self_attn.q_proj,0.0000005414,0.05000,4.013 | |
| 8,self_attn.v_proj,0.0000001743,0.05000,4.020 | |
| 8,self_attn.o_proj,0.0000008939,0.05000,1.346 | |
| 8,mlp.up_proj,0.0000133438,0.05000,2.726 | |
| 8,mlp.gate_proj,0.0000141712,0.05000,2.759 | |
| 8,mlp.down_proj,0.0000041069,0.05000,10.228 | |
| 9,self_attn.k_proj,0.0000001892,0.05000,3.880 | |
| 9,self_attn.v_proj,0.0000002252,0.05000,3.890 | |
| 9,self_attn.q_proj,0.0000006828,0.05000,3.897 | |
| 9,self_attn.o_proj,0.0000012981,0.05000,1.329 | |
| 9,mlp.up_proj,0.0000145487,0.05000,2.761 | |
| 9,mlp.gate_proj,0.0000155021,0.05000,2.767 | |
| 9,mlp.down_proj,0.0000053853,0.05000,10.240 | |
| 10,self_attn.v_proj,0.0000001977,0.05000,3.884 | |
| 10,self_attn.k_proj,0.0000001681,0.05000,3.904 | |
| 10,self_attn.q_proj,0.0000006155,0.05000,3.940 | |
| 10,self_attn.o_proj,0.0000012067,0.05000,1.304 | |
| 10,mlp.gate_proj,0.0000176100,0.05000,2.610 | |
| 10,mlp.up_proj,0.0000166075,0.05000,2.618 | |
| 10,mlp.down_proj,0.0000068149,0.05000,10.222 | |
| 11,self_attn.v_proj,0.0000002852,0.05000,3.778 | |
| 11,self_attn.q_proj,0.0000009002,0.05000,3.850 | |
| 11,self_attn.k_proj,0.0000002500,0.05000,3.867 | |
| 11,self_attn.o_proj,0.0000018442,0.05000,1.320 | |
| 11,mlp.gate_proj,0.0000201731,0.05000,2.687 | |
| 11,mlp.up_proj,0.0000191793,0.05000,2.698 | |
| 11,mlp.down_proj,0.0000086002,0.05000,10.109 | |
| 12,self_attn.q_proj,0.0000011658,0.05000,4.134 | |
| 12,self_attn.k_proj,0.0000003200,0.05000,4.163 | |
| 12,self_attn.v_proj,0.0000003403,0.05000,4.199 | |
| 12,self_attn.o_proj,0.0000022016,0.05000,1.331 | |
| 12,mlp.gate_proj,0.0000228206,0.05000,2.753 | |
| 12,mlp.up_proj,0.0000217454,0.05000,2.783 | |
| 12,mlp.down_proj,0.0000103251,0.05000,10.118 | |
| 13,self_attn.q_proj,0.0000016596,0.05000,4.651 | |
| 13,self_attn.k_proj,0.0000004465,0.05000,4.675 | |
| 13,self_attn.v_proj,0.0000004538,0.05000,4.773 | |
| 13,self_attn.o_proj,0.0000030352,0.05000,1.368 | |
| 13,mlp.gate_proj,0.0000262297,0.05000,2.604 | |
| 13,mlp.up_proj,0.0000248712,0.05000,2.617 | |
| 13,mlp.down_proj,0.0000138197,0.05000,10.216 | |
| 14,self_attn.v_proj,0.0000003687,0.05000,4.427 | |
| 14,self_attn.q_proj,0.0000012519,0.05000,4.455 | |
| 14,self_attn.k_proj,0.0000003375,0.05000,4.480 | |
| 14,self_attn.o_proj,0.0000038044,0.05000,1.326 | |
| 14,mlp.gate_proj,0.0000287475,0.05000,2.522 | |
| 14,mlp.up_proj,0.0000274835,0.05000,2.535 | |
| 14,mlp.down_proj,0.0000172711,0.05000,10.170 | |
| 15,self_attn.k_proj,0.0000003946,0.05000,3.913 | |
| 15,self_attn.v_proj,0.0000004614,0.05000,3.924 | |
| 15,self_attn.q_proj,0.0000014636,0.05000,3.937 | |
| 15,self_attn.o_proj,0.0000056492,0.05000,1.366 | |
| 15,mlp.up_proj,0.0000298630,0.05000,3.639 | |
| 15,mlp.gate_proj,0.0000309857,0.05000,3.675 | |
| 15,mlp.down_proj,0.0000209429,0.05000,10.678 | |
| 16,self_attn.q_proj,0.0000019552,0.05000,4.069 | |
| 16,self_attn.v_proj,0.0000006043,0.05000,4.116 | |
| 16,self_attn.k_proj,0.0000005119,0.05000,4.120 | |
| 16,self_attn.o_proj,0.0000086031,0.05000,1.357 | |
| 16,mlp.gate_proj,0.0000331222,0.05000,2.868 | |
| 16,mlp.up_proj,0.0000318690,0.05000,2.875 | |
| 16,mlp.down_proj,0.0000264157,0.05000,10.113 | |
| 17,self_attn.v_proj,0.0000008096,0.05000,4.083 | |
| 17,self_attn.k_proj,0.0000007743,0.05000,4.092 | |
| 17,self_attn.q_proj,0.0000030872,0.05000,4.102 | |
| 17,self_attn.o_proj,0.0000089122,0.05000,1.335 | |
| 17,mlp.up_proj,0.0000352217,0.05000,2.779 | |
| 17,mlp.gate_proj,0.0000359954,0.05000,2.788 | |
| 17,mlp.down_proj,0.0000333995,0.05000,10.093 | |
| 18,self_attn.v_proj,0.0000010487,0.05000,3.910 | |
| 18,self_attn.k_proj,0.0000009329,0.05000,3.957 | |
| 18,self_attn.q_proj,0.0000036158,0.05000,3.967 | |
| 18,self_attn.o_proj,0.0000114618,0.05000,1.371 | |
| 18,mlp.gate_proj,0.0000416992,0.05000,2.798 | |
| 18,mlp.up_proj,0.0000407445,0.05000,2.805 | |
| 18,mlp.down_proj,0.0000406941,0.05000,10.168 | |
| 19,self_attn.q_proj,0.0000041974,0.05000,3.933 | |
| 19,self_attn.k_proj,0.0000010693,0.05000,3.947 | |
| 19,self_attn.v_proj,0.0000011832,0.05000,3.958 | |
| 19,self_attn.o_proj,0.0000157908,0.05000,1.329 | |
| 19,mlp.up_proj,0.0000455992,0.05000,2.827 | |
| 19,mlp.gate_proj,0.0000466300,0.05000,2.832 | |
| 19,mlp.down_proj,0.0000491709,0.05000,10.111 | |
| 20,self_attn.v_proj,0.0000020002,0.05000,4.173 | |
| 20,self_attn.q_proj,0.0000071319,0.05000,4.172 | |
| 20,self_attn.k_proj,0.0000018153,0.05000,4.195 | |
| 20,self_attn.o_proj,0.0000147102,0.05000,1.360 | |
| 20,mlp.up_proj,0.0000479768,0.05000,2.800 | |
| 20,mlp.gate_proj,0.0000485186,0.05000,2.806 | |
| 20,mlp.down_proj,0.0000547845,0.05000,10.333 | |
| 21,self_attn.v_proj,0.0000018913,0.05000,3.771 | |
| 21,self_attn.q_proj,0.0000072509,0.05000,3.800 | |
| 21,self_attn.k_proj,0.0000018171,0.05000,3.812 | |
| 21,self_attn.o_proj,0.0000254666,0.05000,1.289 | |
| 21,mlp.gate_proj,0.0000515644,0.05000,2.693 | |
| 21,mlp.up_proj,0.0000515692,0.05000,2.708 | |
| 21,mlp.down_proj,0.0000666307,0.05000,10.221 | |
| 22,self_attn.q_proj,0.0000073657,0.05000,4.125 | |
| 22,self_attn.v_proj,0.0000020441,0.05000,4.173 | |
| 22,self_attn.k_proj,0.0000018628,0.05000,4.191 | |
| 22,self_attn.o_proj,0.0000277880,0.05000,1.339 | |
| 22,mlp.up_proj,0.0000568401,0.05000,2.764 | |
| 22,mlp.gate_proj,0.0000567090,0.05000,2.772 | |
| 22,mlp.down_proj,0.0000785028,0.05000,10.157 | |
| 23,self_attn.k_proj,0.0000022589,0.05000,4.088 | |
| 23,self_attn.v_proj,0.0000025075,0.05000,4.116 | |
| 23,self_attn.q_proj,0.0000088587,0.05000,4.123 | |
| 23,self_attn.o_proj,0.0000189992,0.05000,1.296 | |
| 23,mlp.up_proj,0.0000619590,0.05000,3.170 | |
| 23,mlp.gate_proj,0.0000618049,0.05000,3.192 | |
| 23,mlp.down_proj,0.0000903521,0.05000,10.260 | |
| 24,self_attn.q_proj,0.0000126329,0.05000,3.951 | |
| 24,self_attn.v_proj,0.0000035166,0.05000,3.964 | |
| 24,self_attn.k_proj,0.0000031720,0.05000,3.980 | |
| 24,self_attn.o_proj,0.0000331288,0.05000,1.380 | |
| 24,mlp.gate_proj,0.0000658429,0.05000,2.858 | |
| 24,mlp.up_proj,0.0000665991,0.05000,2.876 | |
| 24,mlp.down_proj,0.0001003864,0.05000,10.256 | |
| 25,self_attn.q_proj,0.0000124622,0.05000,3.837 | |
| 25,self_attn.k_proj,0.0000031018,0.05000,3.862 | |
| 25,self_attn.v_proj,0.0000033371,0.05000,3.876 | |
| 25,self_attn.o_proj,0.0000359184,0.05000,1.344 | |
| 25,mlp.gate_proj,0.0000694823,0.05000,2.605 | |
| 25,mlp.up_proj,0.0000707069,0.05000,2.620 | |
| 25,mlp.down_proj,0.0001124752,0.05000,10.744 | |
| 26,self_attn.k_proj,0.0000042816,0.05000,3.783 | |
| 26,self_attn.v_proj,0.0000045993,0.05000,3.805 | |
| 26,self_attn.q_proj,0.0000170768,0.05000,3.812 | |
| 26,self_attn.o_proj,0.0000472656,0.05000,1.307 | |
| 26,mlp.gate_proj,0.0000753305,0.05000,2.946 | |
| 26,mlp.up_proj,0.0000769087,0.05000,2.976 | |
| 26,mlp.down_proj,0.0001320378,0.05000,10.588 | |
| 27,self_attn.v_proj,0.0000049317,0.05000,3.854 | |
| 27,self_attn.q_proj,0.0000179868,0.05000,3.879 | |
| 27,self_attn.k_proj,0.0000043449,0.05000,3.884 | |
| 27,self_attn.o_proj,0.0000529636,0.05000,1.400 | |
| 27,mlp.gate_proj,0.0000816187,0.05000,2.784 | |
| 27,mlp.up_proj,0.0000833050,0.05000,2.796 | |
| 27,mlp.down_proj,0.0001532338,0.05000,10.255 | |
| 28,self_attn.v_proj,0.0000095983,0.05000,4.067 | |
| 28,self_attn.q_proj,0.0000369673,0.05000,4.119 | |
| 28,self_attn.k_proj,0.0000085377,0.05000,4.140 | |
| 28,self_attn.o_proj,0.0000471787,0.05000,1.344 | |
| 28,mlp.gate_proj,0.0000895496,0.05000,2.726 | |
| 28,mlp.up_proj,0.0000922046,0.05000,2.732 | |
| 28,mlp.down_proj,0.0001768752,0.05000,10.292 | |
| 29,self_attn.k_proj,0.0000065192,0.05000,3.884 | |
| 29,self_attn.q_proj,0.0000272154,0.05000,3.926 | |
| 29,self_attn.v_proj,0.0000073348,0.05000,3.932 | |
| 29,self_attn.o_proj,0.0000629508,0.05000,1.333 | |
| 29,mlp.gate_proj,0.0000984423,0.05000,2.682 | |
| 29,mlp.up_proj,0.0001013172,0.05000,2.695 | |
| 29,mlp.down_proj,0.0002126624,0.05000,10.621 | |
| 30,self_attn.k_proj,0.0000069004,0.05000,4.700 | |
| 30,self_attn.v_proj,0.0000073623,0.05000,4.709 | |
| 30,self_attn.q_proj,0.0000281760,0.05000,4.788 | |
| 30,self_attn.o_proj,0.0000648010,0.05000,1.380 | |
| 30,mlp.up_proj,0.0001067660,0.05000,2.688 | |
| 30,mlp.gate_proj,0.0001031451,0.05000,2.698 | |
| 30,mlp.down_proj,0.0002539282,0.05000,10.252 | |
| 31,self_attn.v_proj,0.0000076392,0.05000,3.900 | |
| 31,self_attn.k_proj,0.0000072253,0.05000,3.958 | |
| 31,self_attn.q_proj,0.0000287567,0.05000,3.974 | |
| 31,self_attn.o_proj,0.0000631732,0.05000,1.394 | |
| 31,mlp.gate_proj,0.0001077778,0.05000,3.043 | |
| 31,mlp.up_proj,0.0001128011,0.05000,3.052 | |
| 31,mlp.down_proj,0.0002918915,0.05000,10.297 | |
| 32,self_attn.q_proj,0.0000360973,0.05000,4.621 | |
| 32,self_attn.v_proj,0.0000093422,0.05000,4.698 | |
| 32,self_attn.k_proj,0.0000089061,0.05000,4.764 | |
| 32,self_attn.o_proj,0.0001097469,0.05000,1.352 | |
| 32,mlp.gate_proj,0.0001155008,0.05000,4.010 | |
| 32,mlp.up_proj,0.0001210627,0.05000,4.097 | |
| 32,mlp.down_proj,0.0003264303,0.05000,10.311 | |
| 33,self_attn.q_proj,0.0000374045,0.05000,4.079 | |
| 33,self_attn.k_proj,0.0000091973,0.05000,4.119 | |
| 33,self_attn.v_proj,0.0000100351,0.05000,4.141 | |
| 33,self_attn.o_proj,0.0000995914,0.05000,1.348 | |
| 33,mlp.gate_proj,0.0001323207,0.05000,2.767 | |
| 33,mlp.up_proj,0.0001374208,0.05000,2.778 | |
| 33,mlp.down_proj,0.0003775333,0.05000,10.387 | |
| 34,self_attn.q_proj,0.0000466289,0.05000,4.343 | |
| 34,self_attn.k_proj,0.0000115436,0.05000,4.368 | |
| 34,self_attn.v_proj,0.0000125697,0.05000,4.403 | |
| 34,self_attn.o_proj,0.0000789440,0.05000,1.385 | |
| 34,mlp.gate_proj,0.0001364812,0.05000,2.833 | |
| 34,mlp.up_proj,0.0001426274,0.05000,2.856 | |
| 34,mlp.down_proj,0.0004581308,0.05000,10.545 | |
| 35,self_attn.k_proj,0.0000128505,0.05000,3.844 | |
| 35,self_attn.v_proj,0.0000139194,0.05000,3.875 | |
| 35,self_attn.q_proj,0.0000515437,0.05000,3.908 | |
| 35,self_attn.o_proj,0.0001699727,0.05000,1.321 | |
| 35,mlp.gate_proj,0.0001478171,0.05000,2.790 | |
| 35,mlp.up_proj,0.0001537258,0.05000,2.799 | |
| 35,mlp.down_proj,0.0005565927,0.05000,10.410 | |
| 36,self_attn.q_proj,0.0000797258,0.05000,4.274 | |
| 36,self_attn.v_proj,0.0000207318,0.05000,4.382 | |
| 36,self_attn.k_proj,0.0000191691,0.05000,4.393 | |
| 36,self_attn.o_proj,0.0001257938,0.05000,1.404 | |
| 36,mlp.gate_proj,0.0001650040,0.05000,2.942 | |
| 36,mlp.up_proj,0.0001715282,0.05000,2.942 | |
| 36,mlp.down_proj,0.0006687486,0.05000,10.175 | |
| 37,self_attn.k_proj,0.0000152798,0.05000,4.614 | |
| 37,self_attn.v_proj,0.0000172244,0.05000,4.638 | |
| 37,self_attn.q_proj,0.0000617838,0.05000,4.668 | |
| 37,self_attn.o_proj,0.0001763066,0.05000,1.353 | |
| 37,mlp.gate_proj,0.0001785817,0.05000,3.439 | |
| 37,mlp.up_proj,0.0001860518,0.05000,3.462 | |
| 37,mlp.down_proj,0.0008244158,0.05000,10.256 | |
| 38,self_attn.v_proj,0.0000186834,0.05000,3.811 | |
| 38,self_attn.k_proj,0.0000174050,0.05000,3.822 | |
| 38,self_attn.q_proj,0.0000738627,0.05000,3.900 | |
| 38,self_attn.o_proj,0.0001695878,0.05000,1.347 | |
| 38,mlp.gate_proj,0.0001969437,0.05000,2.807 | |
| 38,mlp.up_proj,0.0002052122,0.05000,2.822 | |
| 38,mlp.down_proj,0.0009937251,0.05000,10.399 | |
| 39,self_attn.q_proj,0.0000827328,0.05000,4.900 | |
| 39,self_attn.v_proj,0.0000207759,0.05000,4.930 | |
| 39,self_attn.k_proj,0.0000197080,0.05000,5.042 | |
| 39,self_attn.o_proj,0.0002096921,0.05000,1.397 | |
| 39,mlp.gate_proj,0.0002047116,0.05000,3.361 | |
| 39,mlp.up_proj,0.0002140854,0.05000,3.386 | |
| 39,mlp.down_proj,0.0011548433,0.05000,10.094 | |
| 40,self_attn.q_proj,0.0001057319,0.05000,4.833 | |
| 40,self_attn.v_proj,0.0000296387,0.05000,4.905 | |
| 40,self_attn.k_proj,0.0000270235,0.05000,4.985 | |
| 40,self_attn.o_proj,0.0002634869,0.05000,1.383 | |
| 40,mlp.gate_proj,0.0002189473,0.05000,3.206 | |
| 40,mlp.up_proj,0.0002252337,0.05000,3.250 | |
| 40,mlp.down_proj,0.0011317164,0.05000,10.291 | |
| 41,self_attn.q_proj,0.0000998817,0.05000,3.800 | |
| 41,self_attn.k_proj,0.0000247796,0.05000,3.861 | |
| 41,self_attn.v_proj,0.0000275091,0.05000,3.871 | |
| 41,self_attn.o_proj,0.0002409238,0.05000,1.352 | |
| 41,mlp.up_proj,0.0002361619,0.05000,2.584 | |
| 41,mlp.gate_proj,0.0002315405,0.05000,2.590 | |
| 41,mlp.down_proj,0.0012460639,0.05000,10.348 | |
| 42,self_attn.q_proj,0.0000925230,0.05000,4.010 | |
| 42,self_attn.k_proj,0.0000238275,0.05000,4.052 | |
| 42,self_attn.v_proj,0.0000273165,0.05000,4.069 | |
| 42,self_attn.o_proj,0.0002579076,0.05000,1.473 | |
| 42,mlp.up_proj,0.0002452240,0.05000,2.846 | |
| 42,mlp.gate_proj,0.0002425512,0.05000,2.867 | |
| 42,mlp.down_proj,0.0013256914,0.05000,10.333 | |
| 43,self_attn.v_proj,0.0000520243,0.05000,4.805 | |
| 43,self_attn.k_proj,0.0000466363,0.05000,4.823 | |
| 43,self_attn.q_proj,0.0001848763,0.05000,4.894 | |
| 43,self_attn.o_proj,0.0003697739,0.05000,1.383 | |
| 43,mlp.up_proj,0.0002634521,0.05000,2.661 | |
| 43,mlp.gate_proj,0.0002616286,0.05000,2.668 | |
| 43,mlp.down_proj,0.0014734533,0.05000,10.517 | |
| 44,self_attn.k_proj,0.0000289557,0.05000,3.680 | |
| 44,self_attn.q_proj,0.0001133079,0.05000,3.697 | |
| 44,self_attn.v_proj,0.0000337912,0.05000,3.709 | |
| 44,self_attn.o_proj,0.0002062722,0.05000,1.369 | |
| 44,mlp.up_proj,0.0002785884,0.05000,2.733 | |
| 44,mlp.gate_proj,0.0002770756,0.05000,2.738 | |
| 44,mlp.down_proj,0.0015221004,0.05000,10.282 | |
| 45,self_attn.k_proj,0.0000289393,0.05000,4.044 | |
| 45,self_attn.v_proj,0.0000350490,0.05000,4.111 | |
| 45,self_attn.q_proj,0.0001110882,0.05000,4.143 | |
| 45,self_attn.o_proj,0.0002006233,0.05000,1.346 | |
| 45,mlp.up_proj,0.0002906391,0.05000,3.571 | |
| 45,mlp.gate_proj,0.0002894125,0.05000,3.605 | |
| 45,mlp.down_proj,0.0016516784,0.05000,10.393 | |
| 46,self_attn.q_proj,0.0001905171,0.05000,4.896 | |
| 46,self_attn.k_proj,0.0000505726,0.05000,5.053 | |
| 46,self_attn.v_proj,0.0000590429,0.05000,5.130 | |
| 46,self_attn.o_proj,0.0003257566,0.05000,1.337 | |
| 46,mlp.gate_proj,0.0003047601,0.05000,3.081 | |
| 46,mlp.up_proj,0.0003055655,0.05000,3.097 | |
| 46,mlp.down_proj,0.0017683138,0.05000,10.817 | |
| 47,self_attn.v_proj,0.0000557610,0.05000,4.544 | |
| 47,self_attn.q_proj,0.0001796675,0.05000,4.587 | |
| 47,self_attn.k_proj,0.0000467443,0.05000,4.682 | |
| 47,self_attn.o_proj,0.0002222129,0.05000,1.330 | |
| 47,mlp.gate_proj,0.0003170164,0.05000,3.908 | |
| 47,mlp.up_proj,0.0003180911,0.05000,3.956 | |
| 47,mlp.down_proj,0.0018363868,0.05000,10.267 | |
| 48,self_attn.q_proj,0.0001660057,0.05000,3.950 | |
| 48,self_attn.k_proj,0.0000447051,0.05000,3.969 | |
| 48,self_attn.v_proj,0.0000531446,0.05000,3.998 | |
| 48,self_attn.o_proj,0.0002315272,0.05000,1.355 | |
| 48,mlp.gate_proj,0.0003298499,0.05000,2.860 | |
| 48,mlp.up_proj,0.0003311301,0.05000,2.876 | |
| 48,mlp.down_proj,0.0019524008,0.05000,10.294 | |
| 49,self_attn.q_proj,0.0001606421,0.05000,4.927 | |
| 49,self_attn.k_proj,0.0000423833,0.05000,5.058 | |
| 49,self_attn.v_proj,0.0000503879,0.05000,5.127 | |
| 49,self_attn.o_proj,0.0002362852,0.05000,1.371 | |
| 49,mlp.gate_proj,0.0003447860,0.05000,2.576 | |
| 49,mlp.up_proj,0.0003473626,0.05000,2.585 | |
| 49,mlp.down_proj,0.0021022653,0.05000,10.278 | |
| 50,self_attn.q_proj,0.0002281217,0.05000,3.814 | |
| 50,self_attn.k_proj,0.0000606198,0.05000,3.875 | |
| 50,self_attn.v_proj,0.0000708845,0.05000,3.901 | |
| 50,self_attn.o_proj,0.0001992800,0.05000,1.354 | |
| 50,mlp.gate_proj,0.0003591935,0.05000,2.549 | |
| 50,mlp.up_proj,0.0003640025,0.05000,2.565 | |
| 50,mlp.down_proj,0.0022086803,0.05000,10.172 | |
| 51,self_attn.q_proj,0.0003117771,0.05000,3.700 | |
| 51,self_attn.v_proj,0.0001091466,0.05000,3.709 | |
| 51,self_attn.k_proj,0.0000827853,0.05000,3.734 | |
| 51,self_attn.o_proj,0.0002843714,0.05000,1.404 | |
| 51,mlp.up_proj,0.0003836008,0.05000,2.636 | |
| 51,mlp.gate_proj,0.0003751998,0.05000,2.652 | |
| 51,mlp.down_proj,0.0024183555,0.05000,10.325 | |
| 52,self_attn.q_proj,0.0002297808,0.05000,4.436 | |
| 52,self_attn.k_proj,0.0000618817,0.05000,4.511 | |
| 52,self_attn.v_proj,0.0000758499,0.05000,4.597 | |
| 52,self_attn.o_proj,0.0003008906,0.05000,1.365 | |
| 52,mlp.up_proj,0.0004042250,0.05000,2.651 | |
| 52,mlp.gate_proj,0.0003910684,0.05000,2.661 | |
| 52,mlp.down_proj,0.0026217234,0.05000,10.365 | |
| 53,self_attn.k_proj,0.0000778189,0.05000,4.138 | |
| 53,self_attn.v_proj,0.0000940183,0.05000,4.194 | |
| 53,self_attn.q_proj,0.0002927864,0.05000,4.206 | |
| 53,self_attn.o_proj,0.0002758975,0.05000,1.376 | |
| 53,mlp.gate_proj,0.0004006354,0.05000,3.502 | |
| 53,mlp.up_proj,0.0004195405,0.05000,3.505 | |
| 53,mlp.down_proj,0.0028683171,0.05000,10.321 | |
| 54,self_attn.q_proj,0.0002656220,0.05000,3.875 | |
| 54,self_attn.k_proj,0.0000713738,0.05000,3.940 | |
| 54,self_attn.v_proj,0.0000844272,0.05000,3.994 | |
| 54,self_attn.o_proj,0.0003021094,0.05000,1.360 | |
| 54,mlp.up_proj,0.0004385530,0.05000,3.079 | |
| 54,mlp.gate_proj,0.0004135394,0.05000,3.108 | |
| 54,mlp.down_proj,0.0031359513,0.05000,10.268 | |
| 55,self_attn.q_proj,0.0002820259,0.05000,3.899 | |
| 55,self_attn.v_proj,0.0000954003,0.05000,3.978 | |
| 55,self_attn.k_proj,0.0000767974,0.05000,4.030 | |
| 55,self_attn.o_proj,0.0004446774,0.05000,1.388 | |
| 55,mlp.gate_proj,0.0004257430,0.05000,2.806 | |
| 55,mlp.up_proj,0.0004582367,0.05000,2.828 | |
| 55,mlp.down_proj,0.0034925919,0.05000,10.308 | |
| 56,self_attn.v_proj,0.0001393293,0.05000,4.965 | |
| 56,self_attn.q_proj,0.0003977993,0.05000,4.978 | |
| 56,self_attn.k_proj,0.0001072885,0.05000,5.089 | |
| 56,self_attn.o_proj,0.0003518363,0.05000,1.368 | |
| 56,mlp.gate_proj,0.0004352606,0.05000,2.559 | |
| 56,mlp.up_proj,0.0004752655,0.05000,2.563 | |
| 56,mlp.down_proj,0.0038588382,0.05000,11.496 | |
| 57,self_attn.q_proj,0.0003542808,0.05000,3.993 | |
| 57,self_attn.k_proj,0.0000966569,0.05000,4.015 | |
| 57,self_attn.v_proj,0.0001193342,0.05000,4.022 | |
| 57,self_attn.o_proj,0.0005018140,0.05000,1.418 | |
| 57,mlp.up_proj,0.0005006724,0.05000,2.886 | |
| 57,mlp.gate_proj,0.0004533908,0.05000,2.894 | |
| 57,mlp.down_proj,0.0045296988,0.05000,10.439 | |
| 58,self_attn.v_proj,0.0000663065,0.05000,4.624 | |
| 58,self_attn.q_proj,0.0002042950,0.05000,4.665 | |
| 58,self_attn.k_proj,0.0000554576,0.05000,4.682 | |
| 58,self_attn.o_proj,0.0003437978,0.05000,1.561 | |
| 58,mlp.gate_proj,0.0004639400,0.05000,3.624 | |
| 58,mlp.up_proj,0.0005164678,0.05000,3.659 | |
| 58,mlp.down_proj,0.0045223694,0.05000,10.299 | |
| 59,self_attn.v_proj,0.0001045671,0.05000,4.096 | |
| 59,self_attn.k_proj,0.0000813153,0.05000,4.130 | |
| 59,self_attn.q_proj,0.0003104069,0.05000,4.148 | |
| 59,self_attn.o_proj,0.0004785528,0.05000,1.353 | |
| 59,mlp.gate_proj,0.0004818735,0.05000,2.698 | |
| 59,mlp.up_proj,0.0005385825,0.05000,2.700 | |
| 59,mlp.down_proj,0.0050474849,0.05000,10.196 | |
| 60,self_attn.v_proj,0.0001792017,0.05000,4.224 | |
| 60,self_attn.k_proj,0.0001330722,0.05000,4.236 | |
| 60,self_attn.q_proj,0.0004933949,0.05000,4.284 | |
| 60,self_attn.o_proj,0.0012227991,0.05000,1.318 | |
| 60,mlp.up_proj,0.0005378991,0.05000,3.336 | |
| 60,mlp.gate_proj,0.0004821140,0.05000,3.351 | |
| 60,mlp.down_proj,0.0054261735,0.05000,11.159 | |
| 61,self_attn.q_proj,0.0003410577,0.05000,4.815 | |
| 61,self_attn.k_proj,0.0000874063,0.05000,4.859 | |
| 61,self_attn.v_proj,0.0001230454,0.05000,4.949 | |
| 61,self_attn.o_proj,0.0009078037,0.05000,1.336 | |
| 61,mlp.gate_proj,0.0004589384,0.05000,2.764 | |
| 61,mlp.up_proj,0.0005126996,0.05000,2.787 | |
| 61,mlp.down_proj,0.0050377736,0.05000,10.219 | |
| 62,self_attn.v_proj,0.0000604726,0.05000,3.870 | |
| 62,self_attn.k_proj,0.0000453193,0.05000,3.891 | |
| 62,self_attn.q_proj,0.0001719647,0.05000,3.918 | |
| 62,self_attn.o_proj,0.0003095673,0.05000,1.296 | |
| 62,mlp.up_proj,0.0004731684,0.05000,2.713 | |
| 62,mlp.gate_proj,0.0004234769,0.05000,2.730 | |
| 62,mlp.down_proj,0.0049185579,0.05000,10.235 | |
| 63,self_attn.k_proj,0.0000462003,0.05000,4.783 | |
| 63,self_attn.q_proj,0.0001753194,0.05000,4.797 | |
| 63,self_attn.v_proj,0.0000657055,0.05000,4.840 | |
| 63,self_attn.o_proj,0.0003810334,0.05000,1.303 | |
| 63,mlp.up_proj,0.0004539171,0.05000,2.676 | |
| 63,mlp.gate_proj,0.0004178135,0.05000,2.685 | |
| 63,mlp.down_proj,0.0061227955,0.05000,10.255 | |