8B-instruct-int2 / quant_log.csv
Matt300209's picture
Upload folder using huggingface_hub
e119363 verified
layer,module,loss,damp,time
0,self_attn.k_proj,11.22799206,0.01000,1.182
0,self_attn.v_proj,0.08241733,0.01000,0.935
0,self_attn.q_proj,17.68160629,0.01000,0.975
0,self_attn.o_proj,0.00721719,0.01000,0.953
0,mlp.up_proj,6.65099096,0.01000,0.966
0,mlp.gate_proj,8.09159565,0.01000,0.967
0,mlp.down_proj,0.03573648,0.01000,4.064
1,self_attn.k_proj,9.22376442,0.01000,0.948
1,self_attn.v_proj,0.28318453,0.01000,0.940
1,self_attn.q_proj,16.18816757,0.01000,0.970
1,self_attn.o_proj,0.02015126,0.01000,0.963
1,mlp.up_proj,13.46427822,0.01000,0.981
1,mlp.gate_proj,16.03173447,0.01000,0.980
1,mlp.down_proj,8.35137749,0.01000,3.998
2,self_attn.k_proj,29.27434731,0.01000,0.944
2,self_attn.v_proj,1.14488220,0.01000,0.953
2,self_attn.q_proj,44.56943512,0.01000,0.961
2,self_attn.o_proj,0.02701145,0.01000,0.964
2,mlp.up_proj,16.96399689,0.01000,0.976
2,mlp.gate_proj,21.46613693,0.01000,0.968
2,mlp.down_proj,0.09852779,0.01000,4.019
3,self_attn.k_proj,26.71245956,0.01000,0.944
3,self_attn.v_proj,2.31728029,0.01000,0.947
3,self_attn.q_proj,47.03275299,0.01000,0.962
3,self_attn.o_proj,0.05190724,0.01000,0.962
3,mlp.up_proj,27.40729141,0.01000,0.976
3,mlp.gate_proj,39.39673615,0.01000,0.972
3,mlp.down_proj,0.22717687,0.01000,4.034
4,self_attn.k_proj,27.54222107,0.01000,0.958
4,self_attn.v_proj,2.55753708,0.01000,0.954
4,self_attn.q_proj,47.58830261,0.01000,1.005
4,self_attn.o_proj,0.11681227,0.01000,0.960
4,mlp.up_proj,35.72327423,0.01000,0.977
4,mlp.gate_proj,58.45260620,0.01000,0.973
4,mlp.down_proj,0.40261966,0.01000,4.039
5,self_attn.k_proj,45.64198685,0.01000,0.954
5,self_attn.v_proj,2.62736511,0.01000,0.936
5,self_attn.q_proj,72.18830872,0.01000,0.958
5,self_attn.o_proj,0.10206828,0.01000,0.956
5,mlp.up_proj,46.87654495,0.01000,0.977
5,mlp.gate_proj,75.59836578,0.01000,0.974
5,mlp.down_proj,0.59073389,0.01000,5.000
6,self_attn.k_proj,41.24952698,0.01000,0.943
6,self_attn.v_proj,3.27706838,0.01000,0.941
6,self_attn.q_proj,72.76811218,0.01000,0.957
6,self_attn.o_proj,0.19349343,0.01000,0.956
6,mlp.up_proj,54.11415100,0.01000,0.982
6,mlp.gate_proj,88.01928711,0.01000,0.977
6,mlp.down_proj,0.75473285,0.01000,3.991
7,self_attn.k_proj,43.62543488,0.01000,0.942
7,self_attn.v_proj,3.61015534,0.01000,0.943
7,self_attn.q_proj,71.84650421,0.01000,0.967
7,self_attn.o_proj,0.24048528,0.01000,0.955
7,mlp.up_proj,57.26372147,0.01000,0.982
7,mlp.gate_proj,87.35131836,0.01000,0.997
7,mlp.down_proj,0.84977585,0.01000,4.009
8,self_attn.k_proj,53.71326065,0.01000,0.945
8,self_attn.v_proj,4.65319824,0.01000,0.956
8,self_attn.q_proj,87.41954041,0.01000,0.969
8,self_attn.o_proj,0.29741907,0.01000,0.961
8,mlp.up_proj,59.96548462,0.01000,0.981
8,mlp.gate_proj,92.74369812,0.01000,0.979
8,mlp.down_proj,0.90413743,0.01000,4.051
9,self_attn.k_proj,53.14421844,0.01000,0.946
9,self_attn.v_proj,6.63929367,0.01000,0.962
9,self_attn.q_proj,89.09582520,0.01000,0.959
9,self_attn.o_proj,0.36242113,0.01000,0.960
9,mlp.up_proj,62.62213135,0.01000,0.982
9,mlp.gate_proj,97.25785828,0.01000,0.977
9,mlp.down_proj,0.94196564,0.01000,4.066
10,self_attn.k_proj,63.22294617,0.01000,0.945
10,self_attn.v_proj,5.22517109,0.01000,0.964
10,self_attn.q_proj,102.96373749,0.01000,0.955
10,self_attn.o_proj,0.32724801,0.01000,0.959
10,mlp.up_proj,65.95198059,0.01000,0.992
10,mlp.gate_proj,95.32070160,0.01000,0.981
10,mlp.down_proj,0.99393255,0.01000,4.061
11,self_attn.k_proj,59.00455856,0.01000,0.949
11,self_attn.v_proj,5.36271477,0.01000,0.970
11,self_attn.q_proj,91.96803284,0.01000,0.960
11,self_attn.o_proj,0.30786622,0.01000,0.984
11,mlp.up_proj,68.84593201,0.01000,0.996
11,mlp.gate_proj,96.15147400,0.01000,0.976
11,mlp.down_proj,1.08279216,0.01000,4.060
12,self_attn.k_proj,45.56399918,0.01000,1.863
12,self_attn.v_proj,6.28582859,0.01000,0.946
12,self_attn.q_proj,79.63566589,0.01000,0.954
12,self_attn.o_proj,0.50937307,0.01000,0.959
12,mlp.up_proj,70.78729248,0.01000,0.983
12,mlp.gate_proj,93.35784912,0.01000,0.981
12,mlp.down_proj,1.21652746,0.01000,3.999
13,self_attn.k_proj,71.59039307,0.01000,0.951
13,self_attn.v_proj,7.24900055,0.01000,0.947
13,self_attn.q_proj,109.80696106,0.01000,0.972
13,self_attn.o_proj,0.47386312,0.01000,0.963
13,mlp.up_proj,76.88529968,0.01000,0.981
13,mlp.gate_proj,101.14041901,0.01000,0.981
13,mlp.down_proj,1.34163332,0.01000,4.006
14,self_attn.k_proj,69.07406616,0.01000,0.945
14,self_attn.v_proj,7.00954533,0.01000,0.941
14,self_attn.q_proj,101.63433838,0.01000,0.964
14,self_attn.o_proj,0.52557290,0.01000,0.980
14,mlp.up_proj,82.75735474,0.01000,0.986
14,mlp.gate_proj,115.41607666,0.01000,0.977
14,mlp.down_proj,1.69118094,0.01000,3.992
15,self_attn.k_proj,64.91668701,0.01000,0.947
15,self_attn.v_proj,8.43104744,0.01000,0.964
15,self_attn.q_proj,122.26741028,0.01000,0.962
15,self_attn.o_proj,0.90873456,0.01000,0.962
15,mlp.up_proj,89.97241211,0.01000,0.981
15,mlp.gate_proj,132.03938293,0.01000,0.975
15,mlp.down_proj,1.97122192,0.01000,4.009
16,self_attn.k_proj,65.04678345,0.01000,0.947
16,self_attn.v_proj,7.19157934,0.01000,0.945
16,self_attn.q_proj,107.82556152,0.01000,0.978
16,self_attn.o_proj,0.65170872,0.01000,0.953
16,mlp.up_proj,96.36511993,0.01000,0.976
16,mlp.gate_proj,150.15841675,0.01000,0.985
16,mlp.down_proj,2.30560780,0.01000,3.990
17,self_attn.k_proj,69.76232910,0.01000,0.963
17,self_attn.v_proj,8.55681229,0.01000,0.948
17,self_attn.q_proj,116.39646912,0.01000,0.964
17,self_attn.o_proj,0.67663085,0.01000,0.966
17,mlp.up_proj,101.97552490,0.01000,0.975
17,mlp.gate_proj,162.89520264,0.01000,0.971
17,mlp.down_proj,2.62797785,0.01000,4.030
18,self_attn.k_proj,75.70587921,0.01000,0.944
18,self_attn.v_proj,7.88881063,0.01000,0.936
18,self_attn.q_proj,114.46511078,0.01000,0.962
18,self_attn.o_proj,0.36577821,0.01000,0.980
18,mlp.up_proj,104.14845276,0.01000,1.000
18,mlp.gate_proj,167.79486084,0.01000,0.973
18,mlp.down_proj,2.61285210,0.01000,4.049
19,self_attn.k_proj,67.59603119,0.01000,0.942
19,self_attn.v_proj,8.80168056,0.01000,0.946
19,self_attn.q_proj,114.31557465,0.01000,0.967
19,self_attn.o_proj,0.41099533,0.01000,0.962
19,mlp.up_proj,106.79249573,0.01000,0.984
19,mlp.gate_proj,175.17819214,0.01000,0.979
19,mlp.down_proj,2.83008838,0.01000,4.059
20,self_attn.k_proj,72.29190826,0.01000,0.965
20,self_attn.v_proj,9.52228069,0.01000,0.968
20,self_attn.q_proj,116.65504456,0.01000,0.963
20,self_attn.o_proj,0.43714535,0.01000,0.965
20,mlp.up_proj,114.59677124,0.01000,0.983
20,mlp.gate_proj,186.40408325,0.01000,0.981
20,mlp.down_proj,3.10870957,0.01000,4.054
21,self_attn.k_proj,70.21195221,0.01000,0.949
21,self_attn.v_proj,9.92044544,0.01000,1.272
21,self_attn.q_proj,111.32563782,0.01000,1.627
21,self_attn.o_proj,0.56897962,0.01000,0.965
21,mlp.up_proj,123.46504211,0.01000,0.992
21,mlp.gate_proj,202.37722778,0.01000,0.978
21,mlp.down_proj,3.51300764,0.01000,4.013
22,self_attn.k_proj,73.74209595,0.01000,0.952
22,self_attn.v_proj,11.55185318,0.01000,0.946
22,self_attn.q_proj,111.50030518,0.01000,0.963
22,self_attn.o_proj,0.73004460,0.01000,0.959
22,mlp.up_proj,128.10562134,0.01000,0.984
22,mlp.gate_proj,208.33113098,0.01000,0.982
22,mlp.down_proj,3.44361711,0.01000,3.985
23,self_attn.k_proj,70.65469360,0.01000,0.947
23,self_attn.v_proj,12.61018848,0.01000,0.942
23,self_attn.q_proj,114.58131409,0.01000,0.953
23,self_attn.o_proj,0.69253051,0.01000,0.963
23,mlp.up_proj,134.70356750,0.01000,0.984
23,mlp.gate_proj,217.82183838,0.01000,0.981
23,mlp.down_proj,3.65843129,0.01000,4.019
24,self_attn.k_proj,70.22497559,0.01000,0.945
24,self_attn.v_proj,15.94941235,0.01000,0.946
24,self_attn.q_proj,117.30754089,0.01000,0.972
24,self_attn.o_proj,0.92370832,0.01000,0.964
24,mlp.up_proj,144.46540833,0.01000,0.983
24,mlp.gate_proj,233.56280518,0.01000,1.005
24,mlp.down_proj,4.04376507,0.01000,4.057
25,self_attn.k_proj,66.74045563,0.01000,0.946
25,self_attn.v_proj,16.83852959,0.01000,0.942
25,self_attn.q_proj,118.24900818,0.01000,0.955
25,self_attn.o_proj,1.22937059,0.01000,0.963
25,mlp.up_proj,153.07160950,0.01000,0.980
25,mlp.gate_proj,247.25921631,0.01000,0.977
25,mlp.down_proj,4.54436493,0.01000,3.983
26,self_attn.k_proj,72.89482880,0.01000,0.962
26,self_attn.v_proj,16.12155724,0.01000,0.946
26,self_attn.q_proj,115.92766571,0.01000,0.973
26,self_attn.o_proj,1.13301432,0.01000,0.964
26,mlp.up_proj,165.55546570,0.01000,0.979
26,mlp.gate_proj,267.83300781,0.01000,0.980
26,mlp.down_proj,5.34906912,0.01000,3.989
27,self_attn.k_proj,78.91761017,0.01000,0.949
27,self_attn.v_proj,22.78813553,0.01000,0.942
27,self_attn.q_proj,121.86432648,0.01000,0.958
27,self_attn.o_proj,2.07942438,0.01000,0.957
27,mlp.up_proj,177.88153076,0.01000,0.983
27,mlp.gate_proj,286.12225342,0.01000,0.976
27,mlp.down_proj,6.25214195,0.01000,4.000
28,self_attn.k_proj,63.79434967,0.01000,0.944
28,self_attn.v_proj,21.07311058,0.01000,0.961
28,self_attn.q_proj,113.87142944,0.01000,0.958
28,self_attn.o_proj,2.18213129,0.01000,0.968
28,mlp.up_proj,199.46273804,0.01000,0.981
28,mlp.gate_proj,306.04187012,0.01000,0.972
28,mlp.down_proj,8.34402084,0.01000,4.050
29,self_attn.k_proj,69.20089722,0.01000,0.959
29,self_attn.v_proj,25.57469940,0.01000,0.970
29,self_attn.q_proj,121.13464355,0.01000,0.961
29,self_attn.o_proj,2.17307186,0.01000,0.963
29,mlp.up_proj,211.52079773,0.01000,0.991
29,mlp.gate_proj,309.66699219,0.01000,0.979
29,mlp.down_proj,11.10927391,0.01000,4.111
30,self_attn.k_proj,67.66032410,0.01000,0.949
30,self_attn.v_proj,34.74767303,0.01000,0.963
30,self_attn.q_proj,114.53169250,0.01000,0.972
30,self_attn.o_proj,5.75792027,0.01000,1.466
30,mlp.up_proj,228.85681152,0.01000,0.989
30,mlp.gate_proj,343.39981079,0.01000,0.978
30,mlp.down_proj,18.97526741,0.01000,4.010
31,self_attn.k_proj,49.98130417,0.01000,0.948
31,self_attn.v_proj,21.36197281,0.01000,0.948
31,self_attn.q_proj,95.31225586,0.01000,0.988
31,self_attn.o_proj,6.19356155,0.01000,0.968
31,mlp.up_proj,220.62313843,0.01000,0.987
31,mlp.gate_proj,322.52499390,0.01000,0.998
31,mlp.down_proj,55.03264236,0.01000,4.004