opt-1.3b-random-tb / quant_log.csv
iproskurina's picture
Add files using upload-large-folder tool
2c8413d verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00409379,0.01000,1.000
0,self_attn.v_proj,0.00072114,0.01000,1.006
0,self_attn.q_proj,0.00414090,0.01000,0.980
0,self_attn.out_proj,0.00001473,0.01000,1.009
0,fc1,0.00906052,0.01000,0.986
0,fc2,0.00011689,0.01000,4.245
1,self_attn.k_proj,0.00241560,0.01000,0.998
1,self_attn.v_proj,0.00030304,0.01000,0.979
1,self_attn.q_proj,0.00263582,0.01000,0.991
1,self_attn.out_proj,0.00001348,0.01000,0.990
1,fc1,0.00911925,0.01000,1.001
1,fc2,0.00113884,0.01000,4.272
2,self_attn.k_proj,0.00382860,0.01000,1.008
2,self_attn.v_proj,0.00054063,0.01000,0.996
2,self_attn.q_proj,0.00378607,0.01000,0.999
2,self_attn.out_proj,0.00000811,0.01000,0.978
2,fc1,0.01030087,0.01000,1.010
2,fc2,0.00010722,0.01000,4.167
3,self_attn.k_proj,0.00392859,0.01000,0.990
3,self_attn.v_proj,0.00063046,0.01000,0.989
3,self_attn.q_proj,0.00420090,0.01000,0.973
3,self_attn.out_proj,0.00001649,0.01000,1.002
3,fc1,0.00846032,0.01000,0.985
3,fc2,0.00012199,0.01000,4.221
4,self_attn.k_proj,0.00556619,0.01000,0.996
4,self_attn.v_proj,0.00072275,0.01000,0.987
4,self_attn.q_proj,0.00558837,0.01000,0.993
4,self_attn.out_proj,0.00001731,0.01000,1.013
4,fc1,0.00879328,0.01000,0.989
4,fc2,0.00011329,0.01000,4.202
5,self_attn.k_proj,0.00716568,0.01000,0.991
5,self_attn.v_proj,0.00093275,0.01000,0.987
5,self_attn.q_proj,0.00673818,0.01000,1.002
5,self_attn.out_proj,0.00003818,0.01000,1.005
5,fc1,0.01022671,0.01000,0.978
5,fc2,0.00017304,0.01000,4.199
6,self_attn.k_proj,0.01196123,0.01000,1.025
6,self_attn.v_proj,0.00122724,0.01000,1.007
6,self_attn.q_proj,0.00925438,0.01000,1.007
6,self_attn.out_proj,0.00006164,0.01000,1.004
6,fc1,0.01337742,0.01000,0.994
6,fc2,0.00021436,0.01000,4.231
7,self_attn.k_proj,0.01336243,0.01000,0.995
7,self_attn.v_proj,0.00149999,0.01000,0.978
7,self_attn.q_proj,0.01013738,0.01000,0.991
7,self_attn.out_proj,0.00006549,0.01000,0.991
7,fc1,0.01671198,0.01000,0.994
7,fc2,0.00019174,0.01000,4.216
8,self_attn.k_proj,0.01508483,0.01000,0.983
8,self_attn.v_proj,0.00175653,0.01000,1.034
8,self_attn.q_proj,0.01071484,0.01000,0.995
8,self_attn.out_proj,0.00006830,0.01000,0.985
8,fc1,0.01985171,0.01000,0.993
8,fc2,0.00024323,0.01000,4.181
9,self_attn.k_proj,0.01629625,0.01000,0.994
9,self_attn.v_proj,0.00207414,0.01000,0.989
9,self_attn.q_proj,0.01226537,0.01000,0.987
9,self_attn.out_proj,0.00007884,0.01000,1.017
9,fc1,0.02325909,0.01000,0.996
9,fc2,0.00029927,0.01000,4.260
10,self_attn.k_proj,0.01694436,0.01000,0.984
10,self_attn.v_proj,0.00279443,0.01000,1.003
10,self_attn.q_proj,0.01290223,0.01000,1.009
10,self_attn.out_proj,0.00008043,0.01000,0.984
10,fc1,0.02705885,0.01000,1.041
10,fc2,0.00040550,0.01000,4.158
11,self_attn.k_proj,0.01743016,0.01000,0.992
11,self_attn.v_proj,0.00366602,0.01000,0.991
11,self_attn.q_proj,0.01367142,0.01000,1.000
11,self_attn.out_proj,0.00010108,0.01000,0.988
11,fc1,0.03210959,0.01000,1.008
11,fc2,0.00055330,0.01000,4.275
12,self_attn.k_proj,0.02062906,0.01000,0.982
12,self_attn.v_proj,0.00437126,0.01000,0.979
12,self_attn.q_proj,0.01520991,0.01000,0.995
12,self_attn.out_proj,0.00014373,0.01000,0.980
12,fc1,0.03572238,0.01000,1.010
12,fc2,0.00066190,0.01000,4.168
13,self_attn.k_proj,0.02250100,0.01000,0.984
13,self_attn.v_proj,0.00493668,0.01000,1.048
13,self_attn.q_proj,0.01598719,0.01000,1.047
13,self_attn.out_proj,0.00015132,0.01000,0.999
13,fc1,0.03995991,0.01000,1.019
13,fc2,0.00083408,0.01000,4.255
14,self_attn.k_proj,0.02120009,0.01000,0.979
14,self_attn.v_proj,0.00648613,0.01000,0.987
14,self_attn.q_proj,0.01573154,0.01000,0.990
14,self_attn.out_proj,0.00017486,0.01000,1.005
14,fc1,0.04477219,0.01000,0.981
14,fc2,0.00120158,0.01000,4.182
15,self_attn.k_proj,0.01888706,0.01000,0.996
15,self_attn.v_proj,0.00828507,0.01000,0.989
15,self_attn.q_proj,0.01590251,0.01000,1.019
15,self_attn.out_proj,0.00018840,0.01000,1.015
15,fc1,0.04777357,0.01000,1.004
15,fc2,0.00149223,0.01000,4.271
16,self_attn.k_proj,0.01895629,0.01000,0.994
16,self_attn.v_proj,0.00919615,0.01000,0.988
16,self_attn.q_proj,0.01408941,0.01000,0.987
16,self_attn.out_proj,0.00027497,0.01000,0.993
16,fc1,0.05255585,0.01000,0.994
16,fc2,0.00180443,0.01000,4.196
17,self_attn.k_proj,0.01800555,0.01000,0.990
17,self_attn.v_proj,0.01010960,0.01000,0.976
17,self_attn.q_proj,0.01410830,0.01000,0.985
17,self_attn.out_proj,0.00029745,0.01000,0.998
17,fc1,0.05777301,0.01000,1.011
17,fc2,0.00218752,0.01000,4.182
18,self_attn.k_proj,0.01598491,0.01000,1.027
18,self_attn.v_proj,0.01118781,0.01000,0.995
18,self_attn.q_proj,0.01337853,0.01000,0.999
18,self_attn.out_proj,0.00052338,0.01000,0.985
18,fc1,0.05900865,0.01000,1.069
18,fc2,0.00268790,0.01000,4.194
19,self_attn.k_proj,0.01571657,0.01000,0.997
19,self_attn.v_proj,0.01393012,0.01000,1.016
19,self_attn.q_proj,0.01293182,0.01000,0.997
19,self_attn.out_proj,0.00089465,0.01000,1.000
19,fc1,0.06260797,0.01000,1.066
19,fc2,0.00281360,0.01000,4.196
20,self_attn.k_proj,0.01550068,0.01000,0.983
20,self_attn.v_proj,0.01531409,0.01000,0.990
20,self_attn.q_proj,0.01223863,0.01000,1.027
20,self_attn.out_proj,0.00108642,0.01000,1.043
20,fc1,0.06158617,0.01000,0.997
20,fc2,0.00320006,0.01000,4.245
21,self_attn.k_proj,0.01362426,0.01000,1.005
21,self_attn.v_proj,0.01469827,0.01000,0.990
21,self_attn.q_proj,0.01251260,0.01000,0.993
21,self_attn.out_proj,0.00081556,0.01000,0.997
21,fc1,0.05632990,0.01000,1.020
21,fc2,0.00376281,0.01000,4.198
22,self_attn.k_proj,0.01262085,0.01000,1.009
22,self_attn.v_proj,0.01517828,0.01000,1.001
22,self_attn.q_proj,0.01358408,0.01000,1.001
22,self_attn.out_proj,0.00131237,0.01000,1.007
22,fc1,0.04993823,0.01000,1.032
22,fc2,0.00548277,0.01000,4.281
23,self_attn.k_proj,0.01658067,0.01000,1.060
23,self_attn.v_proj,0.00926656,0.01000,0.979
23,self_attn.q_proj,0.02430908,0.01000,0.970
23,self_attn.out_proj,0.00185453,0.01000,1.000
23,fc1,0.03861813,0.01000,0.996
23,fc2,0.00391702,0.01000,4.238