Abdohaaland's picture
Upload folder using huggingface_hub
c72312f verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000000529,0.05000,5.639
0,self_attn.v_proj,0.0000000459,0.05000,5.749
0,self_attn.q_proj,0.0000001946,0.05000,5.781
0,self_attn.o_proj,0.0000001205,0.05000,1.680
0,mlp.gate_proj,0.0000119312,0.05000,2.209
0,mlp.up_proj,0.0000104520,0.05000,2.237
0,mlp.down_proj,0.0000016241,0.05000,3.944
1,self_attn.q_proj,0.0000003163,0.05000,5.104
1,self_attn.v_proj,0.0000000882,0.05000,5.167
1,self_attn.k_proj,0.0000000853,0.05000,5.201
1,self_attn.o_proj,0.0000001642,0.05000,1.658
1,mlp.up_proj,0.0001817668,0.05000,2.850
1,mlp.gate_proj,0.0004014041,0.05000,2.881
1,mlp.down_proj,0.0000017688,0.05000,4.370
2,self_attn.q_proj,0.0000008970,0.05000,5.286
2,self_attn.k_proj,0.0000002566,0.05000,5.321
2,self_attn.v_proj,0.0000002510,0.05000,5.343
2,self_attn.o_proj,0.0000002251,0.05000,1.713
2,mlp.gate_proj,0.0006498467,0.05000,2.413
2,mlp.up_proj,0.0005177948,0.05000,2.438
2,mlp.down_proj,0.0000012732,0.05000,4.137
3,self_attn.q_proj,0.0000017194,0.05000,4.685
3,self_attn.k_proj,0.0000004413,0.05000,4.758
3,self_attn.v_proj,0.0000004548,0.05000,4.772
3,self_attn.o_proj,0.0000003429,0.05000,1.565
3,mlp.gate_proj,0.0006881107,0.05000,2.288
3,mlp.up_proj,0.0003561646,0.05000,2.318
3,mlp.down_proj,0.0000036292,0.05000,4.141
4,self_attn.v_proj,0.0000008922,0.05000,4.747
4,self_attn.q_proj,0.0000032643,0.05000,4.819
4,self_attn.k_proj,0.0000008853,0.05000,4.835
4,self_attn.o_proj,0.0000005458,0.05000,1.590
4,mlp.gate_proj,0.0005724557,0.05000,2.200
4,mlp.up_proj,0.0002293439,0.05000,2.225
4,mlp.down_proj,0.0000055330,0.05000,4.094
5,self_attn.q_proj,0.0000035649,0.05000,4.698
5,self_attn.v_proj,0.0000009740,0.05000,4.701
5,self_attn.k_proj,0.0000009058,0.05000,4.750
5,self_attn.o_proj,0.0000009772,0.05000,1.573
5,mlp.gate_proj,0.0002079280,0.05000,2.225
5,mlp.up_proj,0.0001013186,0.05000,2.242
5,mlp.down_proj,0.0000081773,0.05000,4.052
6,self_attn.v_proj,0.0000020665,0.05000,4.633
6,self_attn.k_proj,0.0000018139,0.05000,4.651
6,self_attn.q_proj,0.0000076765,0.05000,4.707
6,self_attn.o_proj,0.0000023579,0.05000,1.543
6,mlp.gate_proj,0.0002195186,0.05000,2.175
6,mlp.up_proj,0.0001256842,0.05000,2.209
6,mlp.down_proj,0.0001805787,0.05000,4.051
7,self_attn.k_proj,0.0000041912,0.05000,4.737
7,self_attn.q_proj,0.0000155375,0.05000,4.792
7,self_attn.v_proj,0.0000043051,0.05000,4.791
7,self_attn.o_proj,0.0000028798,0.05000,1.601
7,mlp.up_proj,0.0001527545,0.05000,2.254
7,mlp.gate_proj,0.0002531733,0.05000,2.284
7,mlp.down_proj,0.0000135267,0.05000,4.097
8,self_attn.k_proj,0.0000061028,0.05000,4.791
8,self_attn.v_proj,0.0000066735,0.05000,4.804
8,self_attn.q_proj,0.0000235807,0.05000,4.855
8,self_attn.o_proj,0.0000041072,0.05000,1.567
8,mlp.up_proj,0.0001451299,0.05000,2.221
8,mlp.gate_proj,0.0001770070,0.05000,2.239
8,mlp.down_proj,0.0000203039,0.05000,4.053
9,self_attn.q_proj,0.0000290558,0.05000,4.707
9,self_attn.v_proj,0.0000080488,0.05000,4.772
9,self_attn.k_proj,0.0000081565,0.05000,4.789
9,self_attn.o_proj,0.0000045795,0.05000,1.552
9,mlp.up_proj,0.0001810021,0.05000,2.156
9,mlp.gate_proj,0.0002832804,0.05000,2.183
9,mlp.down_proj,0.0000204025,0.05000,4.116
10,self_attn.q_proj,0.0000428730,0.05000,4.681
10,self_attn.k_proj,0.0000110682,0.05000,4.728
10,self_attn.v_proj,0.0000127939,0.05000,4.753
10,self_attn.o_proj,0.0000070710,0.05000,1.515
10,mlp.gate_proj,0.0002172222,0.05000,2.220
10,mlp.up_proj,0.0001513125,0.05000,2.218
10,mlp.down_proj,0.0000166309,0.05000,4.037
11,self_attn.k_proj,0.0000055936,0.05000,4.616
11,self_attn.q_proj,0.0000206081,0.05000,4.677
11,self_attn.v_proj,0.0000057883,0.05000,4.701
11,self_attn.o_proj,0.0000043435,0.05000,1.481
11,mlp.up_proj,0.0001400455,0.05000,2.178
11,mlp.gate_proj,0.0001772193,0.05000,2.182
11,mlp.down_proj,0.0000154659,0.05000,4.043
12,self_attn.k_proj,0.0000063814,0.05000,4.536
12,self_attn.q_proj,0.0000242027,0.05000,4.576
12,self_attn.v_proj,0.0000068583,0.05000,4.605
12,self_attn.o_proj,0.0000050332,0.05000,1.562
12,mlp.up_proj,0.0001370627,0.05000,2.161
12,mlp.gate_proj,0.0001573160,0.05000,2.180
12,mlp.down_proj,0.0000155309,0.05000,3.970
13,self_attn.v_proj,0.0000047044,0.05000,4.507
13,self_attn.q_proj,0.0000184363,0.05000,4.572
13,self_attn.k_proj,0.0000048823,0.05000,4.595
13,self_attn.o_proj,0.0000040465,0.05000,1.519
13,mlp.up_proj,0.0001393028,0.05000,2.214
13,mlp.gate_proj,0.0001458737,0.05000,2.229
13,mlp.down_proj,0.0000165562,0.05000,3.984
14,self_attn.k_proj,0.0000078433,0.05000,4.434
14,self_attn.v_proj,0.0000083064,0.05000,4.512
14,self_attn.q_proj,0.0000305769,0.05000,4.529
14,self_attn.o_proj,0.0000068696,0.05000,1.534
14,mlp.gate_proj,0.0001425182,0.05000,2.143
14,mlp.up_proj,0.0001369667,0.05000,2.165
14,mlp.down_proj,0.0000144339,0.05000,3.994
15,self_attn.k_proj,0.0000078901,0.05000,4.457
15,self_attn.q_proj,0.0000304238,0.05000,4.517
15,self_attn.v_proj,0.0000075067,0.05000,4.547
15,self_attn.o_proj,0.0000057910,0.05000,1.549
15,mlp.gate_proj,0.0001314416,0.05000,2.075
15,mlp.up_proj,0.0001308323,0.05000,2.096
15,mlp.down_proj,0.0000141322,0.05000,4.025
16,self_attn.q_proj,0.0000527059,0.05000,4.588
16,self_attn.k_proj,0.0000129936,0.05000,4.645
16,self_attn.v_proj,0.0000147963,0.05000,4.672
16,self_attn.o_proj,0.0000062181,0.05000,1.554
16,mlp.up_proj,0.0001370881,0.05000,2.170
16,mlp.gate_proj,0.0001460451,0.05000,2.173
16,mlp.down_proj,0.0001291258,0.05000,4.031
17,self_attn.k_proj,0.0000099961,0.05000,4.611
17,self_attn.v_proj,0.0000111945,0.05000,4.684
17,self_attn.q_proj,0.0000450757,0.05000,4.705
17,self_attn.o_proj,0.0000065814,0.05000,1.551
17,mlp.up_proj,0.0001229390,0.05000,2.229
17,mlp.gate_proj,0.0001291509,0.05000,2.260
17,mlp.down_proj,0.0000138228,0.05000,4.005
18,self_attn.q_proj,0.0000491217,0.05000,4.514
18,self_attn.k_proj,0.0000119304,0.05000,4.544
18,self_attn.v_proj,0.0000134876,0.05000,4.585
18,self_attn.o_proj,0.0000080063,0.05000,1.528
18,mlp.up_proj,0.0001347442,0.05000,2.151
18,mlp.gate_proj,0.0001388276,0.05000,2.173
18,mlp.down_proj,0.0000170619,0.05000,4.005
19,self_attn.k_proj,0.0000229575,0.05000,4.624
19,self_attn.q_proj,0.0000984122,0.05000,4.668
19,self_attn.v_proj,0.0000236798,0.05000,4.691
19,self_attn.o_proj,0.0000106329,0.05000,1.582
19,mlp.up_proj,0.0001514618,0.05000,2.286
19,mlp.gate_proj,0.0001546628,0.05000,2.302
19,mlp.down_proj,0.0000227354,0.05000,4.005
20,self_attn.q_proj,0.0000933378,0.05000,4.620
20,self_attn.v_proj,0.0000220575,0.05000,4.667
20,self_attn.k_proj,0.0000202215,0.05000,4.695
20,self_attn.o_proj,0.0000106457,0.05000,1.588
20,mlp.up_proj,0.0001666797,0.05000,2.134
20,mlp.gate_proj,0.0001662707,0.05000,2.132
20,mlp.down_proj,0.0000256278,0.05000,3.855
21,self_attn.q_proj,0.0001202196,0.05000,4.409
21,self_attn.k_proj,0.0000271532,0.05000,4.460
21,self_attn.v_proj,0.0000298576,0.05000,4.463
21,self_attn.o_proj,0.0000127776,0.05000,1.502
21,mlp.gate_proj,0.0002019959,0.05000,2.158
21,mlp.up_proj,0.0002010829,0.05000,2.176
21,mlp.down_proj,0.0000345897,0.05000,3.940
22,self_attn.k_proj,0.0000543410,0.05000,4.310
22,self_attn.v_proj,0.0000614177,0.05000,4.389
22,self_attn.q_proj,0.0002431058,0.05000,4.428
22,self_attn.o_proj,0.0000251777,0.05000,1.475
22,mlp.gate_proj,0.0002430665,0.05000,2.006
22,mlp.up_proj,0.0002305638,0.05000,2.024
22,mlp.down_proj,0.0000551142,0.05000,4.117
23,self_attn.k_proj,0.0000548529,0.05000,4.693
23,self_attn.q_proj,0.0002422710,0.05000,4.733
23,self_attn.v_proj,0.0000634447,0.05000,4.766
23,self_attn.o_proj,0.0000301494,0.05000,1.571
23,mlp.up_proj,0.0002738696,0.05000,2.283
23,mlp.gate_proj,0.0003045300,0.05000,2.310
23,mlp.down_proj,0.0000784298,0.05000,4.072
24,self_attn.v_proj,0.0001179669,0.05000,4.527
24,self_attn.k_proj,0.0000914282,0.05000,4.581
24,self_attn.q_proj,0.0003977864,0.05000,4.606
24,self_attn.o_proj,0.0000348926,0.05000,1.539
24,mlp.up_proj,0.0003071852,0.05000,2.174
24,mlp.gate_proj,0.0003468198,0.05000,2.199
24,mlp.down_proj,0.0000987934,0.05000,4.011
25,self_attn.k_proj,0.0000689053,0.05000,4.630
25,self_attn.q_proj,0.0002806590,0.05000,4.681
25,self_attn.v_proj,0.0000781839,0.05000,4.700
25,self_attn.o_proj,0.0000216056,0.05000,1.567
25,mlp.gate_proj,0.0004061265,0.05000,2.350
25,mlp.up_proj,0.0003546657,0.05000,2.372
25,mlp.down_proj,0.0001193259,0.05000,4.131
26,self_attn.q_proj,0.0004597529,0.05000,4.504
26,self_attn.v_proj,0.0001259534,0.05000,4.592
26,self_attn.k_proj,0.0001063583,0.05000,4.603
26,self_attn.o_proj,0.0000202876,0.05000,1.588
26,mlp.up_proj,0.0004417255,0.05000,2.244
26,mlp.gate_proj,0.0004897194,0.05000,2.276
26,mlp.down_proj,0.0001446874,0.05000,4.001
27,self_attn.v_proj,0.0001698991,0.05000,4.541
27,self_attn.q_proj,0.0005717810,0.05000,4.596
27,self_attn.k_proj,0.0001285193,0.05000,4.611
27,self_attn.o_proj,0.0000299984,0.05000,1.533
27,mlp.up_proj,0.0005171644,0.05000,2.243
27,mlp.gate_proj,0.0005543040,0.05000,2.272
27,mlp.down_proj,0.0002140129,0.05000,4.063
28,self_attn.q_proj,0.0006321518,0.05000,4.605
28,self_attn.v_proj,0.0001818466,0.05000,4.617
28,self_attn.k_proj,0.0001574352,0.05000,4.603
28,self_attn.o_proj,0.0000483718,0.05000,1.539
28,mlp.gate_proj,0.0006389360,0.05000,2.202
28,mlp.up_proj,0.0006213975,0.05000,2.220
28,mlp.down_proj,0.0003262202,0.05000,4.026
29,self_attn.k_proj,0.0003507194,0.05000,4.563
29,self_attn.v_proj,0.0004741120,0.05000,4.606
29,self_attn.q_proj,0.0015347515,0.05000,4.631
29,self_attn.o_proj,0.0000478133,0.05000,1.528
29,mlp.gate_proj,0.0007606724,0.05000,2.246
29,mlp.up_proj,0.0007786636,0.05000,2.274
29,mlp.down_proj,0.0003562392,0.05000,4.091
30,self_attn.k_proj,0.0004426675,0.05000,4.557
30,self_attn.q_proj,0.0017618013,0.05000,4.629
30,self_attn.v_proj,0.0005607962,0.05000,4.643
30,self_attn.o_proj,0.0000970244,0.05000,1.504
30,mlp.up_proj,0.0008522944,0.05000,2.130
30,mlp.gate_proj,0.0008062162,0.05000,2.169
30,mlp.down_proj,0.0004936067,0.05000,4.025
31,self_attn.v_proj,0.0008217572,0.05000,4.589
31,self_attn.k_proj,0.0005931148,0.05000,4.626
31,self_attn.q_proj,0.0022387475,0.05000,4.661
31,self_attn.o_proj,0.0000931515,0.05000,1.562
31,mlp.up_proj,0.0009072860,0.05000,2.213
31,mlp.gate_proj,0.0008159017,0.05000,2.236
31,mlp.down_proj,0.0006296246,0.05000,4.061
32,self_attn.v_proj,0.0012069424,0.05000,4.608
32,self_attn.k_proj,0.0007966917,0.05000,4.655
32,self_attn.q_proj,0.0032704534,0.05000,4.695
32,self_attn.o_proj,0.0001177748,0.05000,1.529
32,mlp.up_proj,0.0009638389,0.05000,2.166
32,mlp.gate_proj,0.0008459933,0.05000,2.195
32,mlp.down_proj,0.0007726722,0.05000,3.959
33,self_attn.q_proj,0.0068431394,0.05000,4.501
33,self_attn.v_proj,0.0026603756,0.05000,4.515
33,self_attn.k_proj,0.0013990668,0.05000,4.569
33,self_attn.o_proj,0.0001440813,0.05000,1.581
33,mlp.up_proj,0.0010475062,0.05000,2.215
33,mlp.gate_proj,0.0009084458,0.05000,2.241
33,mlp.down_proj,0.0009851406,0.05000,3.856
34,self_attn.k_proj,0.0012023171,0.05000,4.691
34,self_attn.q_proj,0.0053871334,0.05000,4.754
34,self_attn.v_proj,0.0020066263,0.05000,4.756
34,self_attn.o_proj,0.0002732787,0.05000,1.535
34,mlp.gate_proj,0.0010677983,0.05000,2.184
34,mlp.up_proj,0.0011509700,0.05000,2.210
34,mlp.down_proj,0.0011212979,0.05000,4.006
35,self_attn.v_proj,0.0008843137,0.05000,4.681
35,self_attn.q_proj,0.0025782813,0.05000,4.733
35,self_attn.k_proj,0.0006658983,0.05000,4.775
35,self_attn.o_proj,0.0003583769,0.05000,1.576
35,mlp.gate_proj,0.0016682997,0.05000,2.171
35,mlp.up_proj,0.0017624593,0.05000,2.190
35,mlp.down_proj,0.0016827106,0.05000,4.071