SGPT-125M-scratchmean-nli / eval /similarity_evaluation_sts-dev_results.csv
Muennighoff's picture
Add SGPT-125M-scratchmean-nli
328c780
epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
0,880,0.5298895446169344,0.5312240374218833,0.5117367201753408,0.5245744420855956,0.5104904261012467,0.5231746284173534,0.4585831281872321,0.4757636486142692
0,1760,0.6414522822064204,0.6466598626369797,0.6315813393117423,0.6351470966847795,0.6299802345481992,0.633638220198648,0.5564450205278492,0.5860890895197167
0,2640,0.6651305710363661,0.6758417801736336,0.6722952033313845,0.6762575147352333,0.6732778021726432,0.6770590704485377,0.5615850866939909,0.5915882175060602
0,3520,0.6936786606162212,0.7000569579383393,0.6870984944729166,0.6926032039515108,0.6852739285305858,0.6900644263987616,0.5915931944462255,0.6139743454184338
0,4400,0.700899713888771,0.7047739810339679,0.6920555918002221,0.6958745033620944,0.6916965374691982,0.6954146507315779,0.6066928354981058,0.6273693546624726
0,5280,0.7141938628219852,0.7201963457696333,0.6962514159036581,0.6984396706127707,0.6952247227203017,0.6971711750754467,0.6170316020557418,0.6385997236226345
0,6160,0.7118754507353484,0.7179873371277351,0.6992091001590869,0.7010723806146854,0.6987773965936882,0.7003257377506648,0.619611553839931,0.6403750629261068
0,7040,0.7189095591545901,0.7236743303762333,0.7004906826331114,0.7015026404319671,0.6996276311227727,0.7006774675307638,0.623697167086132,0.6521847383358765
0,7920,0.725586194362776,0.7296134020905084,0.7079407270210554,0.7094840376652114,0.707021328265756,0.7083845297889915,0.6309189030417285,0.655483391857864
0,8800,0.7267545474582126,0.7307983815559623,0.7085992003709655,0.7102699385634418,0.707714153882588,0.709112834562065,0.6312806322363824,0.6558650202351088
0,-1,0.7267570775457864,0.7308159723154326,0.7085975081646948,0.7102818638385754,0.7077130942522993,0.7091036181041682,0.631292016689388,0.6558531305471883