|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,8.41861439,0.01000,0.664
|
|
0,self_attn.v_proj,0.21005458,0.01000,0.469
|
|
0,self_attn.q_proj,17.33579826,0.01000,0.474
|
|
0,self_attn.o_proj,0.02386058,0.01000,0.475
|
|
0,mlp.up_proj,14.27135086,0.01000,0.479
|
|
0,mlp.gate_proj,18.06971550,0.01000,0.475
|
|
0,mlp.down_proj,0.14194207,0.01000,2.035
|
|
1,self_attn.k_proj,16.61663818,0.01000,0.477
|
|
1,self_attn.v_proj,0.92205977,0.01000,0.473
|
|
1,self_attn.q_proj,31.15385056,0.01000,0.477
|
|
1,self_attn.o_proj,0.08981550,0.01000,0.478
|
|
1,mlp.up_proj,22.96321106,0.01000,0.482
|
|
1,mlp.gate_proj,31.65004921,0.01000,0.482
|
|
1,mlp.down_proj,38.26826477,0.01000,2.005
|
|
2,self_attn.k_proj,24.22631836,0.01000,0.480
|
|
2,self_attn.v_proj,1.67933977,0.01000,0.479
|
|
2,self_attn.q_proj,48.14019012,0.01000,0.484
|
|
2,self_attn.o_proj,0.06455882,0.01000,0.515
|
|
2,mlp.up_proj,25.73600769,0.01000,0.480
|
|
2,mlp.gate_proj,41.05938721,0.01000,0.484
|
|
2,mlp.down_proj,0.33432978,0.01000,2.083
|
|
3,self_attn.k_proj,18.33634377,0.01000,0.475
|
|
3,self_attn.v_proj,2.41345811,0.01000,0.476
|
|
3,self_attn.q_proj,40.40703964,0.01000,0.473
|
|
3,self_attn.o_proj,0.13487279,0.01000,0.474
|
|
3,mlp.up_proj,33.06004333,0.01000,0.484
|
|
3,mlp.gate_proj,65.55947113,0.01000,0.486
|
|
3,mlp.down_proj,0.46528998,0.01000,2.138
|
|
4,self_attn.k_proj,20.85830688,0.01000,0.471
|
|
4,self_attn.v_proj,2.46677113,0.01000,0.470
|
|
4,self_attn.q_proj,43.79531097,0.01000,0.473
|
|
4,self_attn.o_proj,0.20654257,0.01000,0.472
|
|
4,mlp.up_proj,35.62884521,0.01000,0.479
|
|
4,mlp.gate_proj,76.35075378,0.01000,0.480
|
|
4,mlp.down_proj,0.52896929,0.01000,2.007
|
|
5,self_attn.k_proj,30.95933533,0.01000,0.474
|
|
5,self_attn.v_proj,2.18834066,0.01000,0.472
|
|
5,self_attn.q_proj,55.54789734,0.01000,0.473
|
|
5,self_attn.o_proj,0.23475912,0.01000,0.471
|
|
5,mlp.up_proj,38.36640930,0.01000,0.483
|
|
5,mlp.gate_proj,70.71673584,0.01000,0.483
|
|
5,mlp.down_proj,0.60111052,0.01000,2.088
|
|
6,self_attn.k_proj,28.12816238,0.01000,0.472
|
|
6,self_attn.v_proj,2.95645475,0.01000,0.472
|
|
6,self_attn.q_proj,43.80027008,0.01000,0.475
|
|
6,self_attn.o_proj,0.30947250,0.01000,0.475
|
|
6,mlp.up_proj,39.52988815,0.01000,0.481
|
|
6,mlp.gate_proj,71.26806641,0.01000,0.482
|
|
6,mlp.down_proj,0.64987046,0.01000,2.019
|
|
7,self_attn.k_proj,29.06768417,0.01000,0.476
|
|
7,self_attn.v_proj,3.53601265,0.01000,0.475
|
|
7,self_attn.q_proj,54.38722992,0.01000,0.474
|
|
7,self_attn.o_proj,0.32754090,0.01000,0.476
|
|
7,mlp.up_proj,43.67794800,0.01000,0.484
|
|
7,mlp.gate_proj,70.55415344,0.01000,0.520
|
|
7,mlp.down_proj,0.72607958,0.01000,2.017
|
|
8,self_attn.k_proj,35.41775131,0.01000,0.474
|
|
8,self_attn.v_proj,3.54361200,0.01000,0.471
|
|
8,self_attn.q_proj,58.69980240,0.01000,0.472
|
|
8,self_attn.o_proj,0.35979411,0.01000,0.473
|
|
8,mlp.up_proj,50.27742386,0.01000,0.482
|
|
8,mlp.gate_proj,78.67279816,0.01000,0.491
|
|
8,mlp.down_proj,0.90459943,0.01000,2.014
|
|
9,self_attn.k_proj,29.37892342,0.01000,0.475
|
|
9,self_attn.v_proj,4.25876951,0.01000,0.473
|
|
9,self_attn.q_proj,71.52907562,0.01000,0.477
|
|
9,self_attn.o_proj,0.65946442,0.01000,0.475
|
|
9,mlp.up_proj,56.33892059,0.01000,0.489
|
|
9,mlp.gate_proj,91.16986084,0.01000,0.488
|
|
9,mlp.down_proj,1.11940432,0.01000,2.018
|
|
10,self_attn.k_proj,36.32312393,0.01000,0.475
|
|
10,self_attn.v_proj,4.55427074,0.01000,0.473
|
|
10,self_attn.q_proj,76.70331573,0.01000,0.502
|
|
10,self_attn.o_proj,0.59689677,0.01000,0.504
|
|
10,mlp.up_proj,70.09442139,0.01000,0.495
|
|
10,mlp.gate_proj,109.52536011,0.01000,0.497
|
|
10,mlp.down_proj,1.58390236,0.01000,2.075
|
|
11,self_attn.k_proj,44.06135941,0.01000,0.472
|
|
11,self_attn.v_proj,4.79146576,0.01000,0.480
|
|
11,self_attn.q_proj,76.30178070,0.01000,0.471
|
|
11,self_attn.o_proj,0.46545687,0.01000,0.477
|
|
11,mlp.up_proj,83.08464050,0.01000,0.513
|
|
11,mlp.gate_proj,127.38317871,0.01000,0.479
|
|
11,mlp.down_proj,2.11763573,0.01000,2.019
|
|
12,self_attn.k_proj,43.86377716,0.01000,0.475
|
|
12,self_attn.v_proj,5.06729603,0.01000,0.477
|
|
12,self_attn.q_proj,79.52319336,0.01000,0.474
|
|
12,self_attn.o_proj,0.51790261,0.01000,0.475
|
|
12,mlp.up_proj,94.49747467,0.01000,0.481
|
|
12,mlp.gate_proj,137.43954468,0.01000,0.480
|
|
12,mlp.down_proj,2.97385502,0.01000,2.009
|
|
13,self_attn.k_proj,46.23298645,0.01000,0.474
|
|
13,self_attn.v_proj,8.45674324,0.01000,0.474
|
|
13,self_attn.q_proj,92.02006531,0.01000,0.480
|
|
13,self_attn.o_proj,0.83154112,0.01000,0.475
|
|
13,mlp.up_proj,113.46607971,0.01000,0.490
|
|
13,mlp.gate_proj,151.12004089,0.01000,0.485
|
|
13,mlp.down_proj,4.34957981,0.01000,2.005
|
|
14,self_attn.k_proj,45.50234222,0.01000,0.472
|
|
14,self_attn.v_proj,16.00457764,0.01000,0.472
|
|
14,self_attn.q_proj,90.30409241,0.01000,0.474
|
|
14,self_attn.o_proj,2.08878922,0.01000,0.478
|
|
14,mlp.up_proj,125.47468567,0.01000,0.484
|
|
14,mlp.gate_proj,180.86888123,0.01000,0.484
|
|
14,mlp.down_proj,5.17438221,0.01000,2.016
|
|
15,self_attn.k_proj,40.97031403,0.01000,0.474
|
|
15,self_attn.v_proj,17.49190903,0.01000,0.474
|
|
15,self_attn.q_proj,84.56118774,0.01000,0.476
|
|
15,self_attn.o_proj,4.40056229,0.01000,0.476
|
|
15,mlp.up_proj,159.97250366,0.01000,0.489
|
|
15,mlp.gate_proj,213.08778381,0.01000,0.481
|
|
15,mlp.down_proj,12.76450062,0.01000,2.024
|
|
|