| layer,module,loss,samples,damp,time | |
| 0,mlp.up_proj,0.0001139788,0.05000,2.730 | |
| 0,mlp.gate_proj,0.0000816036,0.05000,2.795 | |
| 0,mlp.down_proj,0.0000377002,0.05000,4.770 | |
| 0,self_attn.o_proj,failsafe(rtn): 0.0018692,0.00000,0.109 | |
| 0,self_attn.q_proj,0.0001001703,0.05000,1.919 | |
| 0,self_attn.v_proj,0.0000106359,0.05000,1.957 | |
| 0,self_attn.k_proj,0.0000047556,0.05000,1.986 | |
| 0,self_attn.o_gate,0.0002131306,0.05000,0.668 | |
| 1,mlp.gate_proj,0.0000922236,0.05000,2.276 | |
| 1,mlp.up_proj,0.0000972617,0.05000,2.324 | |
| 1,mlp.down_proj,0.0000252440,0.05000,4.242 | |
| 1,self_attn.k_proj,0.0009685841,0.05000,3.029 | |
| 1,self_attn.v_proj,0.0012306731,0.05000,3.042 | |
| 1,self_attn.o_proj,0.0000305169,0.05000,3.046 | |
| 1,self_attn.q_proj,0.0009535788,0.05000,3.056 | |
| 2,mlp.up_proj,0.0001100573,0.05000,2.292 | |
| 2,mlp.gate_proj,0.0001095413,0.05000,2.300 | |
| 2,mlp.down_proj,0.0000370919,0.05000,4.286 | |
| 2,self_attn.o_proj,0.0000110800,0.05000,3.068 | |
| 2,self_attn.k_proj,0.0005334735,0.05000,3.076 | |
| 2,self_attn.q_proj,0.0005377265,0.05000,3.091 | |
| 2,self_attn.v_proj,0.0006325636,0.05000,3.098 | |
| 3,mlp.gate_proj,0.0002075008,0.05000,2.253 | |
| 3,mlp.up_proj,0.0001834026,0.05000,2.266 | |
| 3,mlp.down_proj,0.0000443207,0.05000,4.216 | |
| 3,self_attn.k_proj,0.0006081858,0.05000,2.982 | |
| 3,self_attn.o_proj,0.0000143159,0.05000,2.998 | |
| 3,self_attn.q_proj,0.0005928294,0.05000,3.001 | |
| 3,self_attn.v_proj,0.0006376988,0.05000,3.006 | |
| 4,mlp.gate_proj,0.0002541536,0.05000,2.246 | |
| 4,mlp.up_proj,0.0002309171,0.05000,2.269 | |
| 4,mlp.down_proj,0.0000493166,0.05000,4.221 | |
| 4,self_attn.o_proj,0.0000122342,0.05000,2.982 | |
| 4,self_attn.k_proj,0.0004441993,0.05000,3.005 | |
| 4,self_attn.q_proj,0.0004346599,0.05000,3.013 | |
| 4,self_attn.v_proj,0.0005252177,0.05000,3.016 | |
| 5,mlp.gate_proj,0.0003129852,0.05000,2.235 | |
| 5,mlp.up_proj,0.0002849567,0.05000,2.251 | |
| 5,mlp.down_proj,0.0000529565,0.05000,4.225 | |
| 5,self_attn.k_proj,0.0004888560,0.05000,3.060 | |
| 5,self_attn.o_proj,0.0000177858,0.05000,3.072 | |
| 5,self_attn.q_proj,0.0004625646,0.05000,3.090 | |
| 5,self_attn.v_proj,0.0005211478,0.05000,3.100 | |
| 6,mlp.up_proj,0.0003545977,0.05000,2.236 | |
| 6,mlp.gate_proj,0.0003844595,0.05000,2.241 | |
| 6,mlp.down_proj,0.0000683268,0.05000,4.189 | |
| 6,self_attn.k_proj,0.0005355791,0.05000,2.961 | |
| 6,self_attn.v_proj,0.0004701561,0.05000,2.967 | |
| 6,self_attn.o_proj,0.0000197424,0.05000,2.971 | |
| 6,self_attn.q_proj,0.0004479539,0.05000,2.978 | |
| 7,mlp.gate_proj,0.0004007839,0.05000,2.286 | |
| 7,mlp.up_proj,0.0003775676,0.05000,2.296 | |
| 7,mlp.down_proj,0.0000831422,0.05000,4.269 | |
| 7,self_attn.v_proj,0.0004479891,0.05000,2.972 | |
| 7,self_attn.k_proj,0.0004960482,0.05000,2.976 | |
| 7,self_attn.o_proj,0.0000231072,0.05000,2.987 | |
| 7,self_attn.q_proj,0.0004075726,0.05000,3.002 | |
| 8,mlp.gate_proj,0.0004199805,0.05000,2.241 | |
| 8,mlp.up_proj,0.0003827202,0.05000,2.252 | |
| 8,mlp.down_proj,0.0000806122,0.05000,4.217 | |
| 8,self_attn.o_proj,0.0000282768,0.05000,2.942 | |
| 8,self_attn.k_proj,0.0003548440,0.05000,2.965 | |
| 8,self_attn.q_proj,0.0002887637,0.05000,2.968 | |
| 8,self_attn.v_proj,0.0003144249,0.05000,2.971 | |
| 9,mlp.up_proj,0.0004275542,0.05000,2.253 | |
| 9,mlp.gate_proj,0.0004483688,0.05000,2.277 | |
| 9,mlp.down_proj,0.0000917930,0.05000,4.220 | |
| 9,self_attn.o_proj,failsafe(rtn): 0.0020905,0.00000,0.096 | |
| 9,self_attn.q_proj,0.0003104543,0.05000,1.862 | |
| 9,self_attn.k_proj,0.0000298692,0.05000,1.899 | |
| 9,self_attn.v_proj,0.0000192573,0.05000,1.908 | |
| 9,self_attn.o_gate,0.0002176093,0.05000,0.682 | |
| 10,mlp.gate_proj,0.0004568409,0.05000,2.205 | |
| 10,mlp.up_proj,0.0004427440,0.05000,2.217 | |
| 10,mlp.down_proj,0.0000954703,0.05000,4.187 | |
| 10,self_attn.k_proj,0.0004902110,0.05000,2.916 | |
| 10,self_attn.o_proj,0.0000268956,0.05000,2.940 | |
| 10,self_attn.v_proj,0.0004185948,0.05000,2.938 | |
| 10,self_attn.q_proj,0.0003916300,0.05000,2.948 | |
| 11,mlp.gate_proj,0.0004498163,0.05000,2.247 | |
| 11,mlp.up_proj,0.0004506100,0.05000,2.253 | |
| 11,mlp.down_proj,0.0001055010,0.05000,4.199 | |
| 11,self_attn.o_proj,0.0000336047,0.05000,2.939 | |
| 11,self_attn.k_proj,0.0003669561,0.05000,2.961 | |
| 11,self_attn.q_proj,0.0003018973,0.05000,2.962 | |
| 11,self_attn.v_proj,0.0003209998,0.05000,2.972 | |
| 12,mlp.gate_proj,0.0004327574,0.05000,2.213 | |
| 12,mlp.up_proj,0.0004422537,0.05000,2.217 | |
| 12,mlp.down_proj,0.0001064665,0.05000,4.192 | |
| 12,self_attn.v_proj,0.0004453515,0.05000,2.944 | |
| 12,self_attn.o_proj,0.0000352719,0.05000,2.979 | |
| 12,self_attn.k_proj,0.0004201830,0.05000,2.981 | |
| 12,self_attn.q_proj,0.0003819695,0.05000,2.988 | |
| 13,mlp.gate_proj,0.0004411680,0.05000,2.227 | |
| 13,mlp.up_proj,0.0004594676,0.05000,2.245 | |
| 13,mlp.down_proj,0.0001125713,0.05000,4.201 | |
| 13,self_attn.k_proj,0.0003719480,0.05000,2.953 | |
| 13,self_attn.q_proj,0.0002933697,0.05000,2.958 | |
| 13,self_attn.o_proj,0.0000378701,0.05000,2.967 | |
| 13,self_attn.v_proj,0.0003008936,0.05000,2.972 | |
| 14,mlp.up_proj,0.0004567529,0.05000,2.222 | |
| 14,mlp.gate_proj,0.0004159348,0.05000,2.229 | |
| 14,mlp.down_proj,0.0001232001,0.05000,4.221 | |
| 14,self_attn.v_proj,0.0003152674,0.05000,2.970 | |
| 14,self_attn.k_proj,0.0003643389,0.05000,2.979 | |
| 14,self_attn.o_proj,0.0000488049,0.05000,2.986 | |
| 14,self_attn.q_proj,0.0003182178,0.05000,2.995 | |
| 15,mlp.gate_proj,0.0004251173,0.05000,2.245 | |
| 15,mlp.up_proj,0.0004365050,0.05000,2.267 | |
| 15,mlp.down_proj,0.0001079347,0.05000,4.219 | |
| 15,self_attn.o_proj,0.0000538964,0.05000,2.989 | |
| 15,self_attn.q_proj,0.0002091318,0.05000,2.989 | |
| 15,self_attn.k_proj,0.0002680496,0.05000,3.005 | |
| 15,self_attn.v_proj,0.0002225171,0.05000,3.007 | |
| 16,mlp.gate_proj,0.0004919633,0.05000,2.233 | |
| 16,mlp.up_proj,0.0004810785,0.05000,2.243 | |
| 16,mlp.down_proj,0.0001137119,0.05000,4.214 | |
| 16,self_attn.o_proj,failsafe(rtn): 0.0021057,0.00000,0.093 | |
| 16,self_attn.q_proj,0.0002824569,0.05000,1.913 | |
| 16,self_attn.k_proj,0.0000275908,0.05000,1.953 | |
| 16,self_attn.v_proj,0.0000157489,0.05000,1.959 | |
| 16,self_attn.o_gate,0.0001650757,0.05000,0.685 | |
| 17,mlp.gate_proj,0.0006046007,0.05000,2.274 | |
| 17,mlp.up_proj,0.0005510266,0.05000,2.278 | |
| 17,mlp.down_proj,0.0001312016,0.05000,4.237 | |
| 17,self_attn.o_proj,failsafe(rtn): 0.0021667,0.00000,0.095 | |
| 17,self_attn.v_proj,0.0000211678,0.05000,1.952 | |
| 17,self_attn.q_proj,0.0002673185,0.05000,1.956 | |
| 17,self_attn.k_proj,0.0000233761,0.05000,1.957 | |
| 17,self_attn.o_gate,0.0001793043,0.05000,0.664 | |
| 18,mlp.gate_proj,0.0005101996,0.05000,2.268 | |
| 18,mlp.up_proj,0.0004910317,0.05000,2.275 | |
| 18,mlp.down_proj,0.0001133975,0.05000,4.259 | |
| 18,self_attn.k_proj,0.0003468973,0.05000,3.016 | |
| 18,self_attn.q_proj,0.0002466309,0.05000,3.017 | |
| 18,self_attn.v_proj,0.0002493278,0.05000,3.018 | |
| 18,self_attn.o_proj,0.0000382910,0.05000,3.025 | |
| 19,mlp.up_proj,0.0005109639,0.05000,2.235 | |
| 19,mlp.gate_proj,0.0005002263,0.05000,2.248 | |
| 19,mlp.down_proj,0.0001398108,0.05000,4.201 | |
| 19,self_attn.v_proj,0.0003389656,0.05000,2.989 | |
| 19,self_attn.o_proj,0.0000379808,0.05000,2.998 | |
| 19,self_attn.k_proj,0.0004178796,0.05000,3.007 | |
| 19,self_attn.q_proj,0.0003216561,0.05000,3.009 | |
| 20,mlp.gate_proj,0.0004956775,0.05000,2.259 | |
| 20,mlp.up_proj,0.0005236415,0.05000,2.277 | |
| 20,mlp.down_proj,0.0001796744,0.05000,4.276 | |
| 20,self_attn.k_proj,0.0003484510,0.05000,2.954 | |
| 20,self_attn.o_proj,0.0000471986,0.05000,2.978 | |
| 20,self_attn.q_proj,0.0002609500,0.05000,2.984 | |
| 20,self_attn.v_proj,0.0002615071,0.05000,2.988 | |
| 21,mlp.up_proj,0.0004994372,0.05000,2.266 | |
| 21,mlp.gate_proj,0.0004645316,0.05000,2.279 | |
| 21,mlp.down_proj,0.0001949108,0.05000,4.216 | |
| 21,self_attn.o_proj,0.0000766465,0.05000,2.947 | |
| 21,self_attn.k_proj,0.0003074293,0.05000,2.964 | |
| 21,self_attn.v_proj,0.0002903706,0.05000,2.972 | |
| 21,self_attn.q_proj,0.0002707347,0.05000,2.985 | |
| 22,mlp.up_proj,0.0005572754,0.05000,2.241 | |
| 22,mlp.gate_proj,0.0005191818,0.05000,2.251 | |
| 22,mlp.down_proj,0.0002569589,0.05000,4.209 | |
| 22,self_attn.o_proj,failsafe(rtn): 0.0022430,0.00000,0.097 | |
| 22,self_attn.q_proj,0.0003143768,0.05000,1.880 | |
| 22,self_attn.v_proj,0.0000350399,0.05000,1.934 | |
| 22,self_attn.k_proj,0.0000201146,0.05000,1.937 | |
| 22,self_attn.o_gate,0.0001670687,0.05000,0.694 | |
| 23,mlp.gate_proj,0.0006545052,0.05000,2.243 | |
| 23,mlp.up_proj,0.0007033021,0.05000,2.269 | |
| 23,mlp.down_proj,0.0003489952,0.05000,4.253 | |
| 23,self_attn.k_proj,0.0004181162,0.05000,2.954 | |
| 23,self_attn.o_proj,0.0000832773,0.05000,2.971 | |
| 23,self_attn.v_proj,0.0003177291,0.05000,2.977 | |
| 23,self_attn.q_proj,0.0003282850,0.05000,2.982 | |
| 24,mlp.up_proj,0.0008537005,0.05000,2.230 | |
| 24,mlp.gate_proj,0.0007880767,0.05000,2.232 | |
| 24,mlp.down_proj,0.0005990605,0.05000,4.180 | |
| 24,self_attn.v_proj,0.0002949304,0.05000,2.968 | |
| 24,self_attn.o_proj,0.0001388657,0.05000,2.976 | |
| 24,self_attn.k_proj,0.0003589880,0.05000,2.980 | |
| 24,self_attn.q_proj,0.0002897804,0.05000,2.987 | |
| 25,mlp.up_proj,0.0010665684,0.05000,2.279 | |
| 25,mlp.gate_proj,0.0009695012,0.05000,2.303 | |
| 25,mlp.down_proj,0.0012033481,0.05000,4.299 | |
| 25,self_attn.q_proj,0.0003202692,0.05000,3.038 | |
| 25,self_attn.v_proj,0.0003170714,0.05000,3.044 | |
| 25,self_attn.k_proj,0.0004045218,0.05000,3.050 | |
| 25,self_attn.o_proj,0.0002387067,0.05000,3.056 | |
| 26,mlp.gate_proj,0.0011789015,0.05000,2.229 | |
| 26,mlp.up_proj,0.0013343961,0.05000,2.231 | |
| 26,mlp.down_proj,0.0012957208,0.05000,4.189 | |
| 26,self_attn.v_proj,0.0005397718,0.05000,2.993 | |
| 26,self_attn.k_proj,0.0007869309,0.05000,2.998 | |
| 26,self_attn.q_proj,0.0005534603,0.05000,3.002 | |
| 26,self_attn.o_proj,0.0003255277,0.05000,3.005 | |
| 27,mlp.gate_proj,0.0014277064,0.05000,2.236 | |
| 27,mlp.up_proj,0.0016455295,0.05000,2.244 | |
| 27,mlp.down_proj,0.0018334716,0.05000,4.234 | |
| 27,self_attn.q_proj,0.0005332203,0.05000,2.963 | |
| 27,self_attn.k_proj,0.0005839887,0.05000,2.986 | |
| 27,self_attn.o_proj,0.0002868529,0.05000,2.990 | |
| 27,self_attn.v_proj,0.0005005180,0.05000,2.992 | |
| 28,mlp.gate_proj,0.0016861837,0.05000,2.239 | |
| 28,mlp.up_proj,0.0019899982,0.05000,2.241 | |
| 28,mlp.down_proj,0.0026588713,0.05000,4.218 | |
| 28,self_attn.o_proj,0.0006112322,0.05000,2.959 | |
| 28,self_attn.v_proj,0.0006634702,0.05000,2.966 | |
| 28,self_attn.q_proj,0.0006475543,0.05000,2.974 | |
| 28,self_attn.k_proj,0.0008862655,0.05000,2.979 | |
| 29,mlp.up_proj,0.0023868852,0.05000,2.207 | |
| 29,mlp.gate_proj,0.0019635770,0.05000,2.226 | |
| 29,mlp.down_proj,0.0040410448,0.05000,4.184 | |
| 29,self_attn.o_proj,failsafe(rtn): 0.0025024,0.00000,0.096 | |
| 29,self_attn.v_proj,0.0003332496,0.05000,1.887 | |
| 29,self_attn.q_proj,0.0006649810,0.05000,1.893 | |
| 29,self_attn.k_proj,0.0000341535,0.05000,1.914 | |
| 29,self_attn.o_gate,0.0007388184,0.05000,0.671 | |
| 30,mlp.gate_proj,0.0023512461,0.05000,2.307 | |
| 30,mlp.up_proj,0.0028388989,0.05000,2.311 | |
| 30,mlp.down_proj,0.0072114535,0.05000,4.253 | |
| 30,self_attn.o_proj,failsafe(rtn): 0.0025940,0.00000,0.095 | |
| 30,self_attn.q_proj,0.0009433583,0.05000,1.881 | |
| 30,self_attn.k_proj,0.0000368395,0.05000,1.918 | |
| 30,self_attn.v_proj,0.0009590490,0.05000,1.928 | |
| 30,self_attn.o_gate,0.0010863988,0.05000,0.685 | |
| 31,mlp.up_proj,0.0045522041,0.05000,2.238 | |
| 31,mlp.gate_proj,0.0040763969,0.05000,2.246 | |
| 31,mlp.down_proj,0.0283701427,0.05000,4.203 | |
| 31,self_attn.o_proj,failsafe(rtn): 0.0024261,0.00000,0.096 | |
| 31,self_attn.q_proj,0.0007958777,0.05000,1.886 | |
| 31,self_attn.v_proj,0.0001906893,0.05000,1.936 | |
| 31,self_attn.k_proj,0.0000291729,0.05000,1.937 | |
| 31,self_attn.o_gate,0.0008476649,0.05000,0.697 | |