| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000529,0.05000,5.639 | |
| 0,self_attn.v_proj,0.0000000459,0.05000,5.749 | |
| 0,self_attn.q_proj,0.0000001946,0.05000,5.781 | |
| 0,self_attn.o_proj,0.0000001205,0.05000,1.680 | |
| 0,mlp.gate_proj,0.0000119312,0.05000,2.209 | |
| 0,mlp.up_proj,0.0000104520,0.05000,2.237 | |
| 0,mlp.down_proj,0.0000016241,0.05000,3.944 | |
| 1,self_attn.q_proj,0.0000003163,0.05000,5.104 | |
| 1,self_attn.v_proj,0.0000000882,0.05000,5.167 | |
| 1,self_attn.k_proj,0.0000000853,0.05000,5.201 | |
| 1,self_attn.o_proj,0.0000001642,0.05000,1.658 | |
| 1,mlp.up_proj,0.0001817668,0.05000,2.850 | |
| 1,mlp.gate_proj,0.0004014041,0.05000,2.881 | |
| 1,mlp.down_proj,0.0000017688,0.05000,4.370 | |
| 2,self_attn.q_proj,0.0000008970,0.05000,5.286 | |
| 2,self_attn.k_proj,0.0000002566,0.05000,5.321 | |
| 2,self_attn.v_proj,0.0000002510,0.05000,5.343 | |
| 2,self_attn.o_proj,0.0000002251,0.05000,1.713 | |
| 2,mlp.gate_proj,0.0006498467,0.05000,2.413 | |
| 2,mlp.up_proj,0.0005177948,0.05000,2.438 | |
| 2,mlp.down_proj,0.0000012732,0.05000,4.137 | |
| 3,self_attn.q_proj,0.0000017194,0.05000,4.685 | |
| 3,self_attn.k_proj,0.0000004413,0.05000,4.758 | |
| 3,self_attn.v_proj,0.0000004548,0.05000,4.772 | |
| 3,self_attn.o_proj,0.0000003429,0.05000,1.565 | |
| 3,mlp.gate_proj,0.0006881107,0.05000,2.288 | |
| 3,mlp.up_proj,0.0003561646,0.05000,2.318 | |
| 3,mlp.down_proj,0.0000036292,0.05000,4.141 | |
| 4,self_attn.v_proj,0.0000008922,0.05000,4.747 | |
| 4,self_attn.q_proj,0.0000032643,0.05000,4.819 | |
| 4,self_attn.k_proj,0.0000008853,0.05000,4.835 | |
| 4,self_attn.o_proj,0.0000005458,0.05000,1.590 | |
| 4,mlp.gate_proj,0.0005724557,0.05000,2.200 | |
| 4,mlp.up_proj,0.0002293439,0.05000,2.225 | |
| 4,mlp.down_proj,0.0000055330,0.05000,4.094 | |
| 5,self_attn.q_proj,0.0000035649,0.05000,4.698 | |
| 5,self_attn.v_proj,0.0000009740,0.05000,4.701 | |
| 5,self_attn.k_proj,0.0000009058,0.05000,4.750 | |
| 5,self_attn.o_proj,0.0000009772,0.05000,1.573 | |
| 5,mlp.gate_proj,0.0002079280,0.05000,2.225 | |
| 5,mlp.up_proj,0.0001013186,0.05000,2.242 | |
| 5,mlp.down_proj,0.0000081773,0.05000,4.052 | |
| 6,self_attn.v_proj,0.0000020665,0.05000,4.633 | |
| 6,self_attn.k_proj,0.0000018139,0.05000,4.651 | |
| 6,self_attn.q_proj,0.0000076765,0.05000,4.707 | |
| 6,self_attn.o_proj,0.0000023579,0.05000,1.543 | |
| 6,mlp.gate_proj,0.0002195186,0.05000,2.175 | |
| 6,mlp.up_proj,0.0001256842,0.05000,2.209 | |
| 6,mlp.down_proj,0.0001805787,0.05000,4.051 | |
| 7,self_attn.k_proj,0.0000041912,0.05000,4.737 | |
| 7,self_attn.q_proj,0.0000155375,0.05000,4.792 | |
| 7,self_attn.v_proj,0.0000043051,0.05000,4.791 | |
| 7,self_attn.o_proj,0.0000028798,0.05000,1.601 | |
| 7,mlp.up_proj,0.0001527545,0.05000,2.254 | |
| 7,mlp.gate_proj,0.0002531733,0.05000,2.284 | |
| 7,mlp.down_proj,0.0000135267,0.05000,4.097 | |
| 8,self_attn.k_proj,0.0000061028,0.05000,4.791 | |
| 8,self_attn.v_proj,0.0000066735,0.05000,4.804 | |
| 8,self_attn.q_proj,0.0000235807,0.05000,4.855 | |
| 8,self_attn.o_proj,0.0000041072,0.05000,1.567 | |
| 8,mlp.up_proj,0.0001451299,0.05000,2.221 | |
| 8,mlp.gate_proj,0.0001770070,0.05000,2.239 | |
| 8,mlp.down_proj,0.0000203039,0.05000,4.053 | |
| 9,self_attn.q_proj,0.0000290558,0.05000,4.707 | |
| 9,self_attn.v_proj,0.0000080488,0.05000,4.772 | |
| 9,self_attn.k_proj,0.0000081565,0.05000,4.789 | |
| 9,self_attn.o_proj,0.0000045795,0.05000,1.552 | |
| 9,mlp.up_proj,0.0001810021,0.05000,2.156 | |
| 9,mlp.gate_proj,0.0002832804,0.05000,2.183 | |
| 9,mlp.down_proj,0.0000204025,0.05000,4.116 | |
| 10,self_attn.q_proj,0.0000428730,0.05000,4.681 | |
| 10,self_attn.k_proj,0.0000110682,0.05000,4.728 | |
| 10,self_attn.v_proj,0.0000127939,0.05000,4.753 | |
| 10,self_attn.o_proj,0.0000070710,0.05000,1.515 | |
| 10,mlp.gate_proj,0.0002172222,0.05000,2.220 | |
| 10,mlp.up_proj,0.0001513125,0.05000,2.218 | |
| 10,mlp.down_proj,0.0000166309,0.05000,4.037 | |
| 11,self_attn.k_proj,0.0000055936,0.05000,4.616 | |
| 11,self_attn.q_proj,0.0000206081,0.05000,4.677 | |
| 11,self_attn.v_proj,0.0000057883,0.05000,4.701 | |
| 11,self_attn.o_proj,0.0000043435,0.05000,1.481 | |
| 11,mlp.up_proj,0.0001400455,0.05000,2.178 | |
| 11,mlp.gate_proj,0.0001772193,0.05000,2.182 | |
| 11,mlp.down_proj,0.0000154659,0.05000,4.043 | |
| 12,self_attn.k_proj,0.0000063814,0.05000,4.536 | |
| 12,self_attn.q_proj,0.0000242027,0.05000,4.576 | |
| 12,self_attn.v_proj,0.0000068583,0.05000,4.605 | |
| 12,self_attn.o_proj,0.0000050332,0.05000,1.562 | |
| 12,mlp.up_proj,0.0001370627,0.05000,2.161 | |
| 12,mlp.gate_proj,0.0001573160,0.05000,2.180 | |
| 12,mlp.down_proj,0.0000155309,0.05000,3.970 | |
| 13,self_attn.v_proj,0.0000047044,0.05000,4.507 | |
| 13,self_attn.q_proj,0.0000184363,0.05000,4.572 | |
| 13,self_attn.k_proj,0.0000048823,0.05000,4.595 | |
| 13,self_attn.o_proj,0.0000040465,0.05000,1.519 | |
| 13,mlp.up_proj,0.0001393028,0.05000,2.214 | |
| 13,mlp.gate_proj,0.0001458737,0.05000,2.229 | |
| 13,mlp.down_proj,0.0000165562,0.05000,3.984 | |
| 14,self_attn.k_proj,0.0000078433,0.05000,4.434 | |
| 14,self_attn.v_proj,0.0000083064,0.05000,4.512 | |
| 14,self_attn.q_proj,0.0000305769,0.05000,4.529 | |
| 14,self_attn.o_proj,0.0000068696,0.05000,1.534 | |
| 14,mlp.gate_proj,0.0001425182,0.05000,2.143 | |
| 14,mlp.up_proj,0.0001369667,0.05000,2.165 | |
| 14,mlp.down_proj,0.0000144339,0.05000,3.994 | |
| 15,self_attn.k_proj,0.0000078901,0.05000,4.457 | |
| 15,self_attn.q_proj,0.0000304238,0.05000,4.517 | |
| 15,self_attn.v_proj,0.0000075067,0.05000,4.547 | |
| 15,self_attn.o_proj,0.0000057910,0.05000,1.549 | |
| 15,mlp.gate_proj,0.0001314416,0.05000,2.075 | |
| 15,mlp.up_proj,0.0001308323,0.05000,2.096 | |
| 15,mlp.down_proj,0.0000141322,0.05000,4.025 | |
| 16,self_attn.q_proj,0.0000527059,0.05000,4.588 | |
| 16,self_attn.k_proj,0.0000129936,0.05000,4.645 | |
| 16,self_attn.v_proj,0.0000147963,0.05000,4.672 | |
| 16,self_attn.o_proj,0.0000062181,0.05000,1.554 | |
| 16,mlp.up_proj,0.0001370881,0.05000,2.170 | |
| 16,mlp.gate_proj,0.0001460451,0.05000,2.173 | |
| 16,mlp.down_proj,0.0001291258,0.05000,4.031 | |
| 17,self_attn.k_proj,0.0000099961,0.05000,4.611 | |
| 17,self_attn.v_proj,0.0000111945,0.05000,4.684 | |
| 17,self_attn.q_proj,0.0000450757,0.05000,4.705 | |
| 17,self_attn.o_proj,0.0000065814,0.05000,1.551 | |
| 17,mlp.up_proj,0.0001229390,0.05000,2.229 | |
| 17,mlp.gate_proj,0.0001291509,0.05000,2.260 | |
| 17,mlp.down_proj,0.0000138228,0.05000,4.005 | |
| 18,self_attn.q_proj,0.0000491217,0.05000,4.514 | |
| 18,self_attn.k_proj,0.0000119304,0.05000,4.544 | |
| 18,self_attn.v_proj,0.0000134876,0.05000,4.585 | |
| 18,self_attn.o_proj,0.0000080063,0.05000,1.528 | |
| 18,mlp.up_proj,0.0001347442,0.05000,2.151 | |
| 18,mlp.gate_proj,0.0001388276,0.05000,2.173 | |
| 18,mlp.down_proj,0.0000170619,0.05000,4.005 | |
| 19,self_attn.k_proj,0.0000229575,0.05000,4.624 | |
| 19,self_attn.q_proj,0.0000984122,0.05000,4.668 | |
| 19,self_attn.v_proj,0.0000236798,0.05000,4.691 | |
| 19,self_attn.o_proj,0.0000106329,0.05000,1.582 | |
| 19,mlp.up_proj,0.0001514618,0.05000,2.286 | |
| 19,mlp.gate_proj,0.0001546628,0.05000,2.302 | |
| 19,mlp.down_proj,0.0000227354,0.05000,4.005 | |
| 20,self_attn.q_proj,0.0000933378,0.05000,4.620 | |
| 20,self_attn.v_proj,0.0000220575,0.05000,4.667 | |
| 20,self_attn.k_proj,0.0000202215,0.05000,4.695 | |
| 20,self_attn.o_proj,0.0000106457,0.05000,1.588 | |
| 20,mlp.up_proj,0.0001666797,0.05000,2.134 | |
| 20,mlp.gate_proj,0.0001662707,0.05000,2.132 | |
| 20,mlp.down_proj,0.0000256278,0.05000,3.855 | |
| 21,self_attn.q_proj,0.0001202196,0.05000,4.409 | |
| 21,self_attn.k_proj,0.0000271532,0.05000,4.460 | |
| 21,self_attn.v_proj,0.0000298576,0.05000,4.463 | |
| 21,self_attn.o_proj,0.0000127776,0.05000,1.502 | |
| 21,mlp.gate_proj,0.0002019959,0.05000,2.158 | |
| 21,mlp.up_proj,0.0002010829,0.05000,2.176 | |
| 21,mlp.down_proj,0.0000345897,0.05000,3.940 | |
| 22,self_attn.k_proj,0.0000543410,0.05000,4.310 | |
| 22,self_attn.v_proj,0.0000614177,0.05000,4.389 | |
| 22,self_attn.q_proj,0.0002431058,0.05000,4.428 | |
| 22,self_attn.o_proj,0.0000251777,0.05000,1.475 | |
| 22,mlp.gate_proj,0.0002430665,0.05000,2.006 | |
| 22,mlp.up_proj,0.0002305638,0.05000,2.024 | |
| 22,mlp.down_proj,0.0000551142,0.05000,4.117 | |
| 23,self_attn.k_proj,0.0000548529,0.05000,4.693 | |
| 23,self_attn.q_proj,0.0002422710,0.05000,4.733 | |
| 23,self_attn.v_proj,0.0000634447,0.05000,4.766 | |
| 23,self_attn.o_proj,0.0000301494,0.05000,1.571 | |
| 23,mlp.up_proj,0.0002738696,0.05000,2.283 | |
| 23,mlp.gate_proj,0.0003045300,0.05000,2.310 | |
| 23,mlp.down_proj,0.0000784298,0.05000,4.072 | |
| 24,self_attn.v_proj,0.0001179669,0.05000,4.527 | |
| 24,self_attn.k_proj,0.0000914282,0.05000,4.581 | |
| 24,self_attn.q_proj,0.0003977864,0.05000,4.606 | |
| 24,self_attn.o_proj,0.0000348926,0.05000,1.539 | |
| 24,mlp.up_proj,0.0003071852,0.05000,2.174 | |
| 24,mlp.gate_proj,0.0003468198,0.05000,2.199 | |
| 24,mlp.down_proj,0.0000987934,0.05000,4.011 | |
| 25,self_attn.k_proj,0.0000689053,0.05000,4.630 | |
| 25,self_attn.q_proj,0.0002806590,0.05000,4.681 | |
| 25,self_attn.v_proj,0.0000781839,0.05000,4.700 | |
| 25,self_attn.o_proj,0.0000216056,0.05000,1.567 | |
| 25,mlp.gate_proj,0.0004061265,0.05000,2.350 | |
| 25,mlp.up_proj,0.0003546657,0.05000,2.372 | |
| 25,mlp.down_proj,0.0001193259,0.05000,4.131 | |
| 26,self_attn.q_proj,0.0004597529,0.05000,4.504 | |
| 26,self_attn.v_proj,0.0001259534,0.05000,4.592 | |
| 26,self_attn.k_proj,0.0001063583,0.05000,4.603 | |
| 26,self_attn.o_proj,0.0000202876,0.05000,1.588 | |
| 26,mlp.up_proj,0.0004417255,0.05000,2.244 | |
| 26,mlp.gate_proj,0.0004897194,0.05000,2.276 | |
| 26,mlp.down_proj,0.0001446874,0.05000,4.001 | |
| 27,self_attn.v_proj,0.0001698991,0.05000,4.541 | |
| 27,self_attn.q_proj,0.0005717810,0.05000,4.596 | |
| 27,self_attn.k_proj,0.0001285193,0.05000,4.611 | |
| 27,self_attn.o_proj,0.0000299984,0.05000,1.533 | |
| 27,mlp.up_proj,0.0005171644,0.05000,2.243 | |
| 27,mlp.gate_proj,0.0005543040,0.05000,2.272 | |
| 27,mlp.down_proj,0.0002140129,0.05000,4.063 | |
| 28,self_attn.q_proj,0.0006321518,0.05000,4.605 | |
| 28,self_attn.v_proj,0.0001818466,0.05000,4.617 | |
| 28,self_attn.k_proj,0.0001574352,0.05000,4.603 | |
| 28,self_attn.o_proj,0.0000483718,0.05000,1.539 | |
| 28,mlp.gate_proj,0.0006389360,0.05000,2.202 | |
| 28,mlp.up_proj,0.0006213975,0.05000,2.220 | |
| 28,mlp.down_proj,0.0003262202,0.05000,4.026 | |
| 29,self_attn.k_proj,0.0003507194,0.05000,4.563 | |
| 29,self_attn.v_proj,0.0004741120,0.05000,4.606 | |
| 29,self_attn.q_proj,0.0015347515,0.05000,4.631 | |
| 29,self_attn.o_proj,0.0000478133,0.05000,1.528 | |
| 29,mlp.gate_proj,0.0007606724,0.05000,2.246 | |
| 29,mlp.up_proj,0.0007786636,0.05000,2.274 | |
| 29,mlp.down_proj,0.0003562392,0.05000,4.091 | |
| 30,self_attn.k_proj,0.0004426675,0.05000,4.557 | |
| 30,self_attn.q_proj,0.0017618013,0.05000,4.629 | |
| 30,self_attn.v_proj,0.0005607962,0.05000,4.643 | |
| 30,self_attn.o_proj,0.0000970244,0.05000,1.504 | |
| 30,mlp.up_proj,0.0008522944,0.05000,2.130 | |
| 30,mlp.gate_proj,0.0008062162,0.05000,2.169 | |
| 30,mlp.down_proj,0.0004936067,0.05000,4.025 | |
| 31,self_attn.v_proj,0.0008217572,0.05000,4.589 | |
| 31,self_attn.k_proj,0.0005931148,0.05000,4.626 | |
| 31,self_attn.q_proj,0.0022387475,0.05000,4.661 | |
| 31,self_attn.o_proj,0.0000931515,0.05000,1.562 | |
| 31,mlp.up_proj,0.0009072860,0.05000,2.213 | |
| 31,mlp.gate_proj,0.0008159017,0.05000,2.236 | |
| 31,mlp.down_proj,0.0006296246,0.05000,4.061 | |
| 32,self_attn.v_proj,0.0012069424,0.05000,4.608 | |
| 32,self_attn.k_proj,0.0007966917,0.05000,4.655 | |
| 32,self_attn.q_proj,0.0032704534,0.05000,4.695 | |
| 32,self_attn.o_proj,0.0001177748,0.05000,1.529 | |
| 32,mlp.up_proj,0.0009638389,0.05000,2.166 | |
| 32,mlp.gate_proj,0.0008459933,0.05000,2.195 | |
| 32,mlp.down_proj,0.0007726722,0.05000,3.959 | |
| 33,self_attn.q_proj,0.0068431394,0.05000,4.501 | |
| 33,self_attn.v_proj,0.0026603756,0.05000,4.515 | |
| 33,self_attn.k_proj,0.0013990668,0.05000,4.569 | |
| 33,self_attn.o_proj,0.0001440813,0.05000,1.581 | |
| 33,mlp.up_proj,0.0010475062,0.05000,2.215 | |
| 33,mlp.gate_proj,0.0009084458,0.05000,2.241 | |
| 33,mlp.down_proj,0.0009851406,0.05000,3.856 | |
| 34,self_attn.k_proj,0.0012023171,0.05000,4.691 | |
| 34,self_attn.q_proj,0.0053871334,0.05000,4.754 | |
| 34,self_attn.v_proj,0.0020066263,0.05000,4.756 | |
| 34,self_attn.o_proj,0.0002732787,0.05000,1.535 | |
| 34,mlp.gate_proj,0.0010677983,0.05000,2.184 | |
| 34,mlp.up_proj,0.0011509700,0.05000,2.210 | |
| 34,mlp.down_proj,0.0011212979,0.05000,4.006 | |
| 35,self_attn.v_proj,0.0008843137,0.05000,4.681 | |
| 35,self_attn.q_proj,0.0025782813,0.05000,4.733 | |
| 35,self_attn.k_proj,0.0006658983,0.05000,4.775 | |
| 35,self_attn.o_proj,0.0003583769,0.05000,1.576 | |
| 35,mlp.gate_proj,0.0016682997,0.05000,2.171 | |
| 35,mlp.up_proj,0.0017624593,0.05000,2.190 | |
| 35,mlp.down_proj,0.0016827106,0.05000,4.071 | |