SGPT-125M-mean-nli-bitfit / eval /similarity_evaluation_sts-dev_results.csv
Muennighoff's picture
Add SGPT-125M-mean-nli-bitfit
7fa8bc7
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
0,880,0.7931236103126509,0.7958887004968382,0.7911788235272386,0.7952473779901977,0.7931304731755554,0.7976689017226692,0.6381018595848362,0.6525860855879394
0,1760,0.8006784180926224,0.8060745028998347,0.7976865474131043,0.8028706946390303,0.8002043770569829,0.8060720028981094,0.642754000333759,0.6612242890581526
0,2640,0.8052127901513646,0.8123222598805175,0.7972111700084781,0.8032635169741782,0.7986628130829496,0.8057808852594837,0.6702855681428217,0.6759604077686308
0,3520,0.8075121659952258,0.8152759238405808,0.7990270914061948,0.805254973864518,0.8004195326261134,0.8072635926884097,0.6708924694573102,0.6838648171381387
0,4400,0.8106280964751671,0.8183566677972659,0.8017786608346288,0.8077155769860941,0.8038951930229069,0.8107182214070056,0.675365913797557,0.6858701530416154
0,5280,0.813518228848735,0.8211813869907371,0.8023898568919567,0.8080751501879759,0.8045323391526399,0.8107497249874653,0.676585768512286,0.6910476548353052
0,6160,0.8110038560977901,0.8196029072537244,0.7992417445793695,0.8054486216849892,0.8009445509179719,0.8079312531199992,0.678196437460992,0.689390726645578
0,7040,0.8157543579955957,0.8238793497067225,0.8029583704525003,0.8090371206027318,0.8044661132679434,0.811190935977421,0.6907229472475003,0.6981372486958811
0,7920,0.8145191170896149,0.8224058042058273,0.8019285473685569,0.8080554864733382,0.8036972955743046,0.8104438511108981,0.6817964515054133,0.6945717800431424
0,8800,0.8151300277680787,0.8233908725012917,0.8019063133571251,0.8083050471437834,0.803326408362116,0.8102837976196606,0.6895925378534694,0.6996077764010994
0,-1,0.8151250812171511,0.8233968173452519,0.8018721693747763,0.8082618531637968,0.8032853622824496,0.8102656267886152,0.6895803174365294,0.6996784988698346