|
{ |
|
"best_metric": 0.8548645464866416, |
|
"best_model_checkpoint": "result/InfoCSE-bert-base", |
|
"epoch": 2.0, |
|
"global_step": 31252, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"eval_avg_sts": 0.645032772395593, |
|
"eval_sickr_spearman": 0.6463705264094609, |
|
"eval_stsb_spearman": 0.643695018381725, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.685240727331801, |
|
"eval_sickr_spearman": 0.669725073110526, |
|
"eval_stsb_spearman": 0.700756381553076, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_avg_sts": 0.7027556246143734, |
|
"eval_sickr_spearman": 0.6818145493736003, |
|
"eval_stsb_spearman": 0.7236966998551464, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 6.888007167541277e-06, |
|
"loss": 0.0008, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_avg_sts": 0.7085517582757557, |
|
"eval_sickr_spearman": 0.6868034438177743, |
|
"eval_stsb_spearman": 0.730300072733737, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.04, |
|
"eval_avg_sts": 0.7152446421256347, |
|
"eval_sickr_spearman": 0.6908805158322469, |
|
"eval_stsb_spearman": 0.7396087684190223, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_avg_sts": 0.744333698385975, |
|
"eval_sickr_spearman": 0.7107611650906991, |
|
"eval_stsb_spearman": 0.7779062316812507, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.749906268768782, |
|
"eval_sickr_spearman": 0.7164115438638786, |
|
"eval_stsb_spearman": 0.7834009936736853, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 6.776014335082554e-06, |
|
"loss": 0.0003, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_avg_sts": 0.7527465185576756, |
|
"eval_sickr_spearman": 0.7194187230938174, |
|
"eval_stsb_spearman": 0.7860743140215339, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"eval_avg_sts": 0.7563795190354858, |
|
"eval_sickr_spearman": 0.7197145466475747, |
|
"eval_stsb_spearman": 0.793044491423397, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_avg_sts": 0.7577088125126856, |
|
"eval_sickr_spearman": 0.7209790134240346, |
|
"eval_stsb_spearman": 0.7944386116013368, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_avg_sts": 0.7618327362445115, |
|
"eval_sickr_spearman": 0.7205304029366025, |
|
"eval_stsb_spearman": 0.8031350695524205, |
|
"step": 1375 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 6.6640215026238325e-06, |
|
"loss": 0.0004, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7526454517508075, |
|
"eval_sickr_spearman": 0.7131317881332785, |
|
"eval_stsb_spearman": 0.7921591153683366, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_avg_sts": 0.7584465941723788, |
|
"eval_sickr_spearman": 0.7183862465373038, |
|
"eval_stsb_spearman": 0.798506941807454, |
|
"step": 1625 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_avg_sts": 0.7600830398569421, |
|
"eval_sickr_spearman": 0.7199089285150947, |
|
"eval_stsb_spearman": 0.8002571511987896, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 0.12, |
|
"eval_avg_sts": 0.753643480678329, |
|
"eval_sickr_spearman": 0.7154178764373269, |
|
"eval_stsb_spearman": 0.7918690849193311, |
|
"step": 1875 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 6.55202867016511e-06, |
|
"loss": 0.0002, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_avg_sts": 0.7563852037282979, |
|
"eval_sickr_spearman": 0.7193429780468495, |
|
"eval_stsb_spearman": 0.7934274294097461, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7664707372188553, |
|
"eval_sickr_spearman": 0.7240147231282276, |
|
"eval_stsb_spearman": 0.8089267513094829, |
|
"step": 2125 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_avg_sts": 0.7706419135337745, |
|
"eval_sickr_spearman": 0.7288192261739805, |
|
"eval_stsb_spearman": 0.8124646008935686, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"eval_avg_sts": 0.7712663844837009, |
|
"eval_sickr_spearman": 0.7299219242007967, |
|
"eval_stsb_spearman": 0.8126108447666052, |
|
"step": 2375 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 6.440035837706387e-06, |
|
"loss": 0.0002, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_avg_sts": 0.7728606127631258, |
|
"eval_sickr_spearman": 0.7312590620337324, |
|
"eval_stsb_spearman": 0.8144621634925192, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_avg_sts": 0.7729813550763709, |
|
"eval_sickr_spearman": 0.7313422519014231, |
|
"eval_stsb_spearman": 0.8146204582513188, |
|
"step": 2625 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.7754932728462534, |
|
"eval_sickr_spearman": 0.7312568526030662, |
|
"eval_stsb_spearman": 0.8197296930894405, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"eval_avg_sts": 0.7712885427125948, |
|
"eval_sickr_spearman": 0.7266254056157947, |
|
"eval_stsb_spearman": 0.8159516798093949, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 6.328043005247664e-06, |
|
"loss": 0.0002, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_avg_sts": 0.7716849957034901, |
|
"eval_sickr_spearman": 0.7262548936993011, |
|
"eval_stsb_spearman": 0.8171150977076791, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_avg_sts": 0.7711561198226983, |
|
"eval_sickr_spearman": 0.7262503241591916, |
|
"eval_stsb_spearman": 0.816061915486205, |
|
"step": 3125 |
|
}, |
|
{ |
|
"epoch": 0.21, |
|
"eval_avg_sts": 0.7783568816799603, |
|
"eval_sickr_spearman": 0.7303159233258935, |
|
"eval_stsb_spearman": 0.8263978400340272, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.7809228297940308, |
|
"eval_sickr_spearman": 0.7337628272894983, |
|
"eval_stsb_spearman": 0.8280828322985634, |
|
"step": 3375 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"learning_rate": 6.2160501727889415e-06, |
|
"loss": 0.0001, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_avg_sts": 0.7797812899347809, |
|
"eval_sickr_spearman": 0.7324181485736369, |
|
"eval_stsb_spearman": 0.8271444312959251, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_avg_sts": 0.780044187865891, |
|
"eval_sickr_spearman": 0.7338939041653229, |
|
"eval_stsb_spearman": 0.8261944715664592, |
|
"step": 3625 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_avg_sts": 0.7787673562775448, |
|
"eval_sickr_spearman": 0.7328702653314738, |
|
"eval_stsb_spearman": 0.8246644472236156, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_avg_sts": 0.779541327716536, |
|
"eval_sickr_spearman": 0.7329598913667574, |
|
"eval_stsb_spearman": 0.8261227640663145, |
|
"step": 3875 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 6.104057340330219e-06, |
|
"loss": 0.0003, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.7747719384340315, |
|
"eval_sickr_spearman": 0.7285930957484098, |
|
"eval_stsb_spearman": 0.8209507811196531, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_avg_sts": 0.7765396311685044, |
|
"eval_sickr_spearman": 0.7301922912707919, |
|
"eval_stsb_spearman": 0.8228869710662171, |
|
"step": 4125 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_avg_sts": 0.7728155845030844, |
|
"eval_sickr_spearman": 0.7257823156922516, |
|
"eval_stsb_spearman": 0.8198488533139171, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_avg_sts": 0.7734186821765212, |
|
"eval_sickr_spearman": 0.7266760303967105, |
|
"eval_stsb_spearman": 0.8201613339563318, |
|
"step": 4375 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"learning_rate": 5.992064507871497e-06, |
|
"loss": 0.0004, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_avg_sts": 0.7731296739509669, |
|
"eval_sickr_spearman": 0.7214541370794603, |
|
"eval_stsb_spearman": 0.8248052108224735, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.7728203601265164, |
|
"eval_sickr_spearman": 0.7219969845879138, |
|
"eval_stsb_spearman": 0.8236437356651191, |
|
"step": 4625 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_avg_sts": 0.773140320693449, |
|
"eval_sickr_spearman": 0.7226297943493609, |
|
"eval_stsb_spearman": 0.823650847037537, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 0.31, |
|
"eval_avg_sts": 0.7776841987101548, |
|
"eval_sickr_spearman": 0.7260857761911376, |
|
"eval_stsb_spearman": 0.8292826212291721, |
|
"step": 4875 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 5.880071675412773e-06, |
|
"loss": 0.0001, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_avg_sts": 0.7787697170418183, |
|
"eval_sickr_spearman": 0.7268813633553585, |
|
"eval_stsb_spearman": 0.8306580707282781, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_avg_sts": 0.7794054673251014, |
|
"eval_sickr_spearman": 0.727022190544775, |
|
"eval_stsb_spearman": 0.8317887441054277, |
|
"step": 5125 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.7794784586068343, |
|
"eval_sickr_spearman": 0.7302013691489637, |
|
"eval_stsb_spearman": 0.8287555480647049, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_avg_sts": 0.7771717407788259, |
|
"eval_sickr_spearman": 0.7244288472848269, |
|
"eval_stsb_spearman": 0.829914634272825, |
|
"step": 5375 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 5.7680788429540505e-06, |
|
"loss": 0.0003, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_avg_sts": 0.778478777290903, |
|
"eval_sickr_spearman": 0.7256252059594475, |
|
"eval_stsb_spearman": 0.8313323486223586, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_avg_sts": 0.7793214110914728, |
|
"eval_sickr_spearman": 0.726303453142855, |
|
"eval_stsb_spearman": 0.8323393690400904, |
|
"step": 5625 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"eval_avg_sts": 0.7791715295390024, |
|
"eval_sickr_spearman": 0.7257507592586067, |
|
"eval_stsb_spearman": 0.8325922998193981, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.7800081020871235, |
|
"eval_sickr_spearman": 0.726603503433539, |
|
"eval_stsb_spearman": 0.8334127007407081, |
|
"step": 5875 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"learning_rate": 5.656086010495328e-06, |
|
"loss": 0.0001, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_avg_sts": 0.7802662913925068, |
|
"eval_sickr_spearman": 0.7272382344390437, |
|
"eval_stsb_spearman": 0.8332943483459699, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_avg_sts": 0.7788831909074992, |
|
"eval_sickr_spearman": 0.7254892779423776, |
|
"eval_stsb_spearman": 0.8322771038726209, |
|
"step": 6125 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_avg_sts": 0.7790896526834474, |
|
"eval_sickr_spearman": 0.7246235173389557, |
|
"eval_stsb_spearman": 0.8335557880279391, |
|
"step": 6250 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_avg_sts": 0.7811606337604482, |
|
"eval_sickr_spearman": 0.7249414832304759, |
|
"eval_stsb_spearman": 0.8373797842904204, |
|
"step": 6375 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"learning_rate": 5.544093178036605e-06, |
|
"loss": 0.0001, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.7814213566702608, |
|
"eval_sickr_spearman": 0.7254279422258411, |
|
"eval_stsb_spearman": 0.8374147711146805, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_avg_sts": 0.7818500804137162, |
|
"eval_sickr_spearman": 0.726220023119657, |
|
"eval_stsb_spearman": 0.8374801377077753, |
|
"step": 6625 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_avg_sts": 0.7832040571269738, |
|
"eval_sickr_spearman": 0.7301835015792287, |
|
"eval_stsb_spearman": 0.8362246126747188, |
|
"step": 6750 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_avg_sts": 0.7841900708722672, |
|
"eval_sickr_spearman": 0.731056755034475, |
|
"eval_stsb_spearman": 0.8373233867100595, |
|
"step": 6875 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 5.432100345577883e-06, |
|
"loss": 0.0001, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_avg_sts": 0.7862472754964975, |
|
"eval_sickr_spearman": 0.7333967342343369, |
|
"eval_stsb_spearman": 0.839097816758658, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.7859634761320248, |
|
"eval_sickr_spearman": 0.7330241089493801, |
|
"eval_stsb_spearman": 0.8389028433146695, |
|
"step": 7125 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_avg_sts": 0.7821803440191185, |
|
"eval_sickr_spearman": 0.7303841755210372, |
|
"eval_stsb_spearman": 0.8339765125171998, |
|
"step": 7250 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_avg_sts": 0.7825744125697178, |
|
"eval_sickr_spearman": 0.7306357624303699, |
|
"eval_stsb_spearman": 0.8345130627090659, |
|
"step": 7375 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 5.32010751311916e-06, |
|
"loss": 0.0001, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_avg_sts": 0.78116110534451, |
|
"eval_sickr_spearman": 0.7276775268927966, |
|
"eval_stsb_spearman": 0.8346446837962234, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_avg_sts": 0.7799908773501631, |
|
"eval_sickr_spearman": 0.7237501678215064, |
|
"eval_stsb_spearman": 0.83623158687882, |
|
"step": 7625 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.780269211830304, |
|
"eval_sickr_spearman": 0.7244608359983847, |
|
"eval_stsb_spearman": 0.8360775876622232, |
|
"step": 7750 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_avg_sts": 0.7807594418954099, |
|
"eval_sickr_spearman": 0.7247573319875622, |
|
"eval_stsb_spearman": 0.8367615518032576, |
|
"step": 7875 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"learning_rate": 5.2081146806604376e-06, |
|
"loss": 0.0001, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_avg_sts": 0.7809657512161441, |
|
"eval_sickr_spearman": 0.7257775125821077, |
|
"eval_stsb_spearman": 0.8361539898501805, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_avg_sts": 0.7808305047079998, |
|
"eval_sickr_spearman": 0.7258256397457487, |
|
"eval_stsb_spearman": 0.8358353696702507, |
|
"step": 8125 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"eval_avg_sts": 0.7808244974473546, |
|
"eval_sickr_spearman": 0.7260765061885599, |
|
"eval_stsb_spearman": 0.8355724887061494, |
|
"step": 8250 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.7807531331871759, |
|
"eval_sickr_spearman": 0.725998455648723, |
|
"eval_stsb_spearman": 0.8355078107256287, |
|
"step": 8375 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"learning_rate": 5.096121848201715e-06, |
|
"loss": 0.0001, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_avg_sts": 0.7805553727181309, |
|
"eval_sickr_spearman": 0.7259074847425994, |
|
"eval_stsb_spearman": 0.8352032606936624, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_avg_sts": 0.7840901636781107, |
|
"eval_sickr_spearman": 0.727197936344937, |
|
"eval_stsb_spearman": 0.8409823910112844, |
|
"step": 8625 |
|
}, |
|
{ |
|
"epoch": 0.56, |
|
"eval_avg_sts": 0.7841336470257416, |
|
"eval_sickr_spearman": 0.7241774524998998, |
|
"eval_stsb_spearman": 0.8440898415515834, |
|
"step": 8750 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_avg_sts": 0.7848770188208263, |
|
"eval_sickr_spearman": 0.7246812987539857, |
|
"eval_stsb_spearman": 0.8450727388876668, |
|
"step": 8875 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"learning_rate": 4.984129015742992e-06, |
|
"loss": 0.0001, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.7851602291221325, |
|
"eval_sickr_spearman": 0.7257603654788943, |
|
"eval_stsb_spearman": 0.8445600927653706, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.7881113225894085, |
|
"eval_sickr_spearman": 0.7297208179790754, |
|
"eval_stsb_spearman": 0.8465018271997418, |
|
"step": 9125 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_avg_sts": 0.7883865180777926, |
|
"eval_sickr_spearman": 0.7305029084037921, |
|
"eval_stsb_spearman": 0.8462701277517931, |
|
"step": 9250 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_avg_sts": 0.7905936766250409, |
|
"eval_sickr_spearman": 0.7318727073857056, |
|
"eval_stsb_spearman": 0.8493146458643761, |
|
"step": 9375 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 4.872136183284269e-06, |
|
"loss": 0.0002, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_avg_sts": 0.7894195399749903, |
|
"eval_sickr_spearman": 0.7297918559781024, |
|
"eval_stsb_spearman": 0.8490472239718782, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.7888302258840285, |
|
"eval_sickr_spearman": 0.7290175946229199, |
|
"eval_stsb_spearman": 0.848642857145137, |
|
"step": 9625 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_avg_sts": 0.7898168606884958, |
|
"eval_sickr_spearman": 0.7311126152054476, |
|
"eval_stsb_spearman": 0.848521106171544, |
|
"step": 9750 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_avg_sts": 0.7916780015304804, |
|
"eval_sickr_spearman": 0.7336695508905056, |
|
"eval_stsb_spearman": 0.8496864521704552, |
|
"step": 9875 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 4.760143350825547e-06, |
|
"loss": 0.0001, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_avg_sts": 0.7916349913886156, |
|
"eval_sickr_spearman": 0.7339293030870828, |
|
"eval_stsb_spearman": 0.8493406796901484, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_avg_sts": 0.791507759549186, |
|
"eval_sickr_spearman": 0.7339989962152694, |
|
"eval_stsb_spearman": 0.8490165228831026, |
|
"step": 10125 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.789931989918206, |
|
"eval_sickr_spearman": 0.7311775052234905, |
|
"eval_stsb_spearman": 0.8486864746129216, |
|
"step": 10250 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_avg_sts": 0.7899616736779131, |
|
"eval_sickr_spearman": 0.7317643492208613, |
|
"eval_stsb_spearman": 0.8481589981349649, |
|
"step": 10375 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"learning_rate": 4.648150518366825e-06, |
|
"loss": 0.0001, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"eval_avg_sts": 0.7926863693434811, |
|
"eval_sickr_spearman": 0.7347004424206716, |
|
"eval_stsb_spearman": 0.8506722962662906, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_avg_sts": 0.7925310701894714, |
|
"eval_sickr_spearman": 0.7345030826248625, |
|
"eval_stsb_spearman": 0.8505590577540805, |
|
"step": 10625 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"eval_avg_sts": 0.7921847237714013, |
|
"eval_sickr_spearman": 0.734286503995874, |
|
"eval_stsb_spearman": 0.8500829435469286, |
|
"step": 10750 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.792045037000692, |
|
"eval_sickr_spearman": 0.7345833425953655, |
|
"eval_stsb_spearman": 0.8495067314060183, |
|
"step": 10875 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 4.536157685908102e-06, |
|
"loss": 0.0001, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_avg_sts": 0.7924996456713199, |
|
"eval_sickr_spearman": 0.7354074602338407, |
|
"eval_stsb_spearman": 0.8495918311087991, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_avg_sts": 0.7924266596358673, |
|
"eval_sickr_spearman": 0.7356516503535521, |
|
"eval_stsb_spearman": 0.8492016689181826, |
|
"step": 11125 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"eval_avg_sts": 0.7926706111519558, |
|
"eval_sickr_spearman": 0.7358917097985398, |
|
"eval_stsb_spearman": 0.8494495125053718, |
|
"step": 11250 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"eval_avg_sts": 0.7930288164708986, |
|
"eval_sickr_spearman": 0.7354914185991545, |
|
"eval_stsb_spearman": 0.8505662143426428, |
|
"step": 11375 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 4.424164853449379e-06, |
|
"loss": 0.0002, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.7926251189281965, |
|
"eval_sickr_spearman": 0.7351442017668584, |
|
"eval_stsb_spearman": 0.8501060360895348, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_avg_sts": 0.7932695687388167, |
|
"eval_sickr_spearman": 0.7365684199867013, |
|
"eval_stsb_spearman": 0.8499707174909322, |
|
"step": 11625 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_avg_sts": 0.7935921856407616, |
|
"eval_sickr_spearman": 0.7367729844477262, |
|
"eval_stsb_spearman": 0.850411386833797, |
|
"step": 11750 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_avg_sts": 0.794782209944985, |
|
"eval_sickr_spearman": 0.7389587838119719, |
|
"eval_stsb_spearman": 0.8506056360779983, |
|
"step": 11875 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 4.312172020990656e-06, |
|
"loss": 0.0002, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_avg_sts": 0.7971707208949131, |
|
"eval_sickr_spearman": 0.7394768953031847, |
|
"eval_stsb_spearman": 0.8548645464866416, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.797638118412404, |
|
"eval_sickr_spearman": 0.7421029957743136, |
|
"eval_stsb_spearman": 0.8531732410504944, |
|
"step": 12125 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_avg_sts": 0.7969091025343611, |
|
"eval_sickr_spearman": 0.741429359576644, |
|
"eval_stsb_spearman": 0.8523888454920783, |
|
"step": 12250 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"eval_avg_sts": 0.7919648350492454, |
|
"eval_sickr_spearman": 0.7347034683800623, |
|
"eval_stsb_spearman": 0.8492262017184287, |
|
"step": 12375 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 4.2001791885319345e-06, |
|
"loss": 0.0005, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_avg_sts": 0.7921636059370547, |
|
"eval_sickr_spearman": 0.7353516480939697, |
|
"eval_stsb_spearman": 0.8489755637801396, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_avg_sts": 0.7924202367929077, |
|
"eval_sickr_spearman": 0.736975675695795, |
|
"eval_stsb_spearman": 0.8478647978900204, |
|
"step": 12625 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.7890475112371416, |
|
"eval_sickr_spearman": 0.7355575093947334, |
|
"eval_stsb_spearman": 0.8425375130795496, |
|
"step": 12750 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"eval_avg_sts": 0.7892144058224184, |
|
"eval_sickr_spearman": 0.7356575101479275, |
|
"eval_stsb_spearman": 0.8427713014969095, |
|
"step": 12875 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"learning_rate": 4.088186356073212e-06, |
|
"loss": 0.0002, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"eval_avg_sts": 0.7908518455947956, |
|
"eval_sickr_spearman": 0.73698621219475, |
|
"eval_stsb_spearman": 0.8447174789948412, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_avg_sts": 0.7910358332545967, |
|
"eval_sickr_spearman": 0.7372511340625426, |
|
"eval_stsb_spearman": 0.8448205324466508, |
|
"step": 13125 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"eval_avg_sts": 0.7910819619646265, |
|
"eval_sickr_spearman": 0.7366442130647706, |
|
"eval_stsb_spearman": 0.8455197108644826, |
|
"step": 13250 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.7913313391681369, |
|
"eval_sickr_spearman": 0.7369983463756739, |
|
"eval_stsb_spearman": 0.8456643319606, |
|
"step": 13375 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"learning_rate": 3.976193523614489e-06, |
|
"loss": 0.0002, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_avg_sts": 0.7912515138401426, |
|
"eval_sickr_spearman": 0.7371570411348254, |
|
"eval_stsb_spearman": 0.8453459865454599, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_avg_sts": 0.7912798783058242, |
|
"eval_sickr_spearman": 0.7375416261640404, |
|
"eval_stsb_spearman": 0.8450181304476081, |
|
"step": 13625 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"eval_avg_sts": 0.7915843291718891, |
|
"eval_sickr_spearman": 0.7376919154804402, |
|
"eval_stsb_spearman": 0.845476742863338, |
|
"step": 13750 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"eval_avg_sts": 0.7917255539871094, |
|
"eval_sickr_spearman": 0.7381062797925467, |
|
"eval_stsb_spearman": 0.8453448281816721, |
|
"step": 13875 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 3.864200691155766e-06, |
|
"loss": 0.0001, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.7916416194141285, |
|
"eval_sickr_spearman": 0.7380577683800943, |
|
"eval_stsb_spearman": 0.8452254704481627, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_avg_sts": 0.7924269371428458, |
|
"eval_sickr_spearman": 0.738714977941072, |
|
"eval_stsb_spearman": 0.8461388963446196, |
|
"step": 14125 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"eval_avg_sts": 0.7923356777507629, |
|
"eval_sickr_spearman": 0.7386597902055195, |
|
"eval_stsb_spearman": 0.8460115652960062, |
|
"step": 14250 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"eval_avg_sts": 0.7922805942330418, |
|
"eval_sickr_spearman": 0.7387613759850612, |
|
"eval_stsb_spearman": 0.8457998124810223, |
|
"step": 14375 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 3.7522078586970435e-06, |
|
"loss": 0.0001, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_avg_sts": 0.7934966210957259, |
|
"eval_sickr_spearman": 0.7397510568301936, |
|
"eval_stsb_spearman": 0.8472421853612582, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.7930449265696451, |
|
"eval_sickr_spearman": 0.7393639741837038, |
|
"eval_stsb_spearman": 0.8467258789555864, |
|
"step": 14625 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_avg_sts": 0.7924737714972381, |
|
"eval_sickr_spearman": 0.7393996612920722, |
|
"eval_stsb_spearman": 0.845547881702404, |
|
"step": 14750 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"eval_avg_sts": 0.792308440851152, |
|
"eval_sickr_spearman": 0.739175211955052, |
|
"eval_stsb_spearman": 0.845441669747252, |
|
"step": 14875 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 3.6402150262383203e-06, |
|
"loss": 0.0001, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"eval_avg_sts": 0.7932488441451628, |
|
"eval_sickr_spearman": 0.7404715713828667, |
|
"eval_stsb_spearman": 0.8460261169074589, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_avg_sts": 0.7931158785146848, |
|
"eval_sickr_spearman": 0.7406130710077032, |
|
"eval_stsb_spearman": 0.8456186860216665, |
|
"step": 15125 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.7945903311020877, |
|
"eval_sickr_spearman": 0.7431428210893474, |
|
"eval_stsb_spearman": 0.8460378411148278, |
|
"step": 15250 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_avg_sts": 0.7948596387785098, |
|
"eval_sickr_spearman": 0.7440196288461001, |
|
"eval_stsb_spearman": 0.8456996487109196, |
|
"step": 15375 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 3.5282221937795976e-06, |
|
"loss": 0.0002, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_avg_sts": 0.7948372805541641, |
|
"eval_sickr_spearman": 0.744097679385937, |
|
"eval_stsb_spearman": 0.8455768817223914, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_avg_sts": 0.7937246352478757, |
|
"eval_sickr_spearman": 0.7439027691763012, |
|
"eval_stsb_spearman": 0.8435465013194503, |
|
"step": 15625 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_avg_sts": 0.7937099307469273, |
|
"eval_sickr_spearman": 0.7440485435691657, |
|
"eval_stsb_spearman": 0.8433713179246888, |
|
"step": 15750 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"eval_avg_sts": 0.7935877720189825, |
|
"eval_sickr_spearman": 0.7440728953375949, |
|
"eval_stsb_spearman": 0.84310264870037, |
|
"step": 15875 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"learning_rate": 3.4162293613208757e-06, |
|
"loss": 0.0001, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"eval_avg_sts": 0.7935863758797379, |
|
"eval_sickr_spearman": 0.744390621073608, |
|
"eval_stsb_spearman": 0.8427821306858677, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 1.03, |
|
"eval_avg_sts": 0.7937197747425322, |
|
"eval_sickr_spearman": 0.7444404293257993, |
|
"eval_stsb_spearman": 0.8429991201592651, |
|
"step": 16125 |
|
}, |
|
{ |
|
"epoch": 1.04, |
|
"eval_avg_sts": 0.7924446512199308, |
|
"eval_sickr_spearman": 0.7440353830473717, |
|
"eval_stsb_spearman": 0.8408539193924898, |
|
"step": 16250 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"eval_avg_sts": 0.7905555822474897, |
|
"eval_sickr_spearman": 0.7383070017654566, |
|
"eval_stsb_spearman": 0.8428041627295226, |
|
"step": 16375 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"learning_rate": 3.304236528862153e-06, |
|
"loss": 0.0001, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"eval_avg_sts": 0.7899406430528368, |
|
"eval_sickr_spearman": 0.737816219970962, |
|
"eval_stsb_spearman": 0.8420650661347118, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"eval_avg_sts": 0.7921524290697161, |
|
"eval_sickr_spearman": 0.7417105816755641, |
|
"eval_stsb_spearman": 0.842594276463868, |
|
"step": 16625 |
|
}, |
|
{ |
|
"epoch": 1.07, |
|
"eval_avg_sts": 0.7909061020892134, |
|
"eval_sickr_spearman": 0.7410022670226564, |
|
"eval_stsb_spearman": 0.8408099371557706, |
|
"step": 16750 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"eval_avg_sts": 0.7911860344103485, |
|
"eval_sickr_spearman": 0.7404902554813262, |
|
"eval_stsb_spearman": 0.841881813339371, |
|
"step": 16875 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 3.19224369640343e-06, |
|
"loss": 0.0002, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"eval_avg_sts": 0.7912332320403954, |
|
"eval_sickr_spearman": 0.7405556258103834, |
|
"eval_stsb_spearman": 0.8419108382704075, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"eval_avg_sts": 0.791745368257589, |
|
"eval_sickr_spearman": 0.7407413620796446, |
|
"eval_stsb_spearman": 0.8427493744355335, |
|
"step": 17125 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"eval_avg_sts": 0.7936116457907827, |
|
"eval_sickr_spearman": 0.7417212926111849, |
|
"eval_stsb_spearman": 0.8455019989703806, |
|
"step": 17250 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"eval_avg_sts": 0.7936037695250758, |
|
"eval_sickr_spearman": 0.7418167304097425, |
|
"eval_stsb_spearman": 0.8453908086404092, |
|
"step": 17375 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 3.0802508639447074e-06, |
|
"loss": 0.0002, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"eval_avg_sts": 0.792413452164604, |
|
"eval_sickr_spearman": 0.7425937295377067, |
|
"eval_stsb_spearman": 0.8422331747915013, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 1.13, |
|
"eval_avg_sts": 0.7927184217670188, |
|
"eval_sickr_spearman": 0.7428243748868126, |
|
"eval_stsb_spearman": 0.8426124686472249, |
|
"step": 17625 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_avg_sts": 0.7926960182448954, |
|
"eval_sickr_spearman": 0.742725526880053, |
|
"eval_stsb_spearman": 0.842666509609738, |
|
"step": 17750 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_avg_sts": 0.7927521207425385, |
|
"eval_sickr_spearman": 0.7428051144151359, |
|
"eval_stsb_spearman": 0.8426991270699412, |
|
"step": 17875 |
|
}, |
|
{ |
|
"epoch": 1.15, |
|
"learning_rate": 2.9682580314859847e-06, |
|
"loss": 0.0, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.15, |
|
"eval_avg_sts": 0.7928433137943678, |
|
"eval_sickr_spearman": 0.7426588116801555, |
|
"eval_stsb_spearman": 0.8430278159085801, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"eval_avg_sts": 0.792833492411573, |
|
"eval_sickr_spearman": 0.7426310977346257, |
|
"eval_stsb_spearman": 0.8430358870885203, |
|
"step": 18125 |
|
}, |
|
{ |
|
"epoch": 1.17, |
|
"eval_avg_sts": 0.7928841848486375, |
|
"eval_sickr_spearman": 0.742908285221025, |
|
"eval_stsb_spearman": 0.84286008447625, |
|
"step": 18250 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_avg_sts": 0.7925150543842555, |
|
"eval_sickr_spearman": 0.743895084200071, |
|
"eval_stsb_spearman": 0.84113502456844, |
|
"step": 18375 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 2.8562651990272623e-06, |
|
"loss": 0.0001, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_avg_sts": 0.7919487675309846, |
|
"eval_sickr_spearman": 0.7431525714029392, |
|
"eval_stsb_spearman": 0.84074496365903, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_avg_sts": 0.7919787220051326, |
|
"eval_sickr_spearman": 0.7432353770218185, |
|
"eval_stsb_spearman": 0.8407220669884469, |
|
"step": 18625 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_avg_sts": 0.7920516311468476, |
|
"eval_sickr_spearman": 0.7433836010008565, |
|
"eval_stsb_spearman": 0.8407196612928387, |
|
"step": 18750 |
|
}, |
|
{ |
|
"epoch": 1.21, |
|
"eval_avg_sts": 0.79208040900112, |
|
"eval_sickr_spearman": 0.7434916709790923, |
|
"eval_stsb_spearman": 0.8406691470231478, |
|
"step": 18875 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 2.7442723665685396e-06, |
|
"loss": 0.0001, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"eval_avg_sts": 0.7915679899923007, |
|
"eval_sickr_spearman": 0.7422913257230525, |
|
"eval_stsb_spearman": 0.8408446542615489, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"eval_avg_sts": 0.7924488788916606, |
|
"eval_sickr_spearman": 0.7431180370410052, |
|
"eval_stsb_spearman": 0.8417797207423161, |
|
"step": 19125 |
|
}, |
|
{ |
|
"epoch": 1.23, |
|
"eval_avg_sts": 0.7925131080137356, |
|
"eval_sickr_spearman": 0.7439811559338482, |
|
"eval_stsb_spearman": 0.8410450600936231, |
|
"step": 19250 |
|
}, |
|
{ |
|
"epoch": 1.24, |
|
"eval_avg_sts": 0.7923092664958495, |
|
"eval_sickr_spearman": 0.7438394641846057, |
|
"eval_stsb_spearman": 0.8407790688070933, |
|
"step": 19375 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 2.632279534109817e-06, |
|
"loss": 0.0002, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_avg_sts": 0.7915084313605771, |
|
"eval_sickr_spearman": 0.7429506966835948, |
|
"eval_stsb_spearman": 0.8400661660375595, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_avg_sts": 0.7914848286255316, |
|
"eval_sickr_spearman": 0.7429546352339128, |
|
"eval_stsb_spearman": 0.8400150220171504, |
|
"step": 19625 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_avg_sts": 0.7919444499131418, |
|
"eval_sickr_spearman": 0.7435056960607123, |
|
"eval_stsb_spearman": 0.8403832037655713, |
|
"step": 19750 |
|
}, |
|
{ |
|
"epoch": 1.27, |
|
"eval_avg_sts": 0.7918604283998938, |
|
"eval_sickr_spearman": 0.7430511777478034, |
|
"eval_stsb_spearman": 0.8406696790519842, |
|
"step": 19875 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 2.5202867016510945e-06, |
|
"loss": 0.0001, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"eval_avg_sts": 0.7901084692338984, |
|
"eval_sickr_spearman": 0.7411617302794309, |
|
"eval_stsb_spearman": 0.839055208188366, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.29, |
|
"eval_avg_sts": 0.789757862825201, |
|
"eval_sickr_spearman": 0.7407969340640084, |
|
"eval_stsb_spearman": 0.8387187915863936, |
|
"step": 20125 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_avg_sts": 0.7898529068915039, |
|
"eval_sickr_spearman": 0.7409771947877056, |
|
"eval_stsb_spearman": 0.8387286189953022, |
|
"step": 20250 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_avg_sts": 0.789768082574833, |
|
"eval_sickr_spearman": 0.74083372588771, |
|
"eval_stsb_spearman": 0.838702439261956, |
|
"step": 20375 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 2.4082938691923718e-06, |
|
"loss": 0.0, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_avg_sts": 0.7897954058339804, |
|
"eval_sickr_spearman": 0.7408093260881794, |
|
"eval_stsb_spearman": 0.8387814855797816, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 1.32, |
|
"eval_avg_sts": 0.7899947832336973, |
|
"eval_sickr_spearman": 0.7409338707342086, |
|
"eval_stsb_spearman": 0.8390556957331861, |
|
"step": 20625 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"eval_avg_sts": 0.790202509592782, |
|
"eval_sickr_spearman": 0.7411228731183674, |
|
"eval_stsb_spearman": 0.8392821460671965, |
|
"step": 20750 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"eval_avg_sts": 0.7901906011266497, |
|
"eval_sickr_spearman": 0.7410648995789316, |
|
"eval_stsb_spearman": 0.839316302674368, |
|
"step": 20875 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"learning_rate": 2.296301036733649e-06, |
|
"loss": 0.0, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"eval_avg_sts": 0.7902077356957227, |
|
"eval_sickr_spearman": 0.7411439107407973, |
|
"eval_stsb_spearman": 0.839271560650648, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 1.35, |
|
"eval_avg_sts": 0.7901431265829444, |
|
"eval_sickr_spearman": 0.7410307494658092, |
|
"eval_stsb_spearman": 0.8392555037000796, |
|
"step": 21125 |
|
}, |
|
{ |
|
"epoch": 1.36, |
|
"eval_avg_sts": 0.7921962350985728, |
|
"eval_sickr_spearman": 0.7434804797324572, |
|
"eval_stsb_spearman": 0.8409119904646885, |
|
"step": 21250 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"eval_avg_sts": 0.7922085580785473, |
|
"eval_sickr_spearman": 0.7434956095294102, |
|
"eval_stsb_spearman": 0.8409215066276844, |
|
"step": 21375 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"learning_rate": 2.1843082042749267e-06, |
|
"loss": 0.0001, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"eval_avg_sts": 0.7922422656604595, |
|
"eval_sickr_spearman": 0.7434714018542854, |
|
"eval_stsb_spearman": 0.8410131294666336, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"eval_avg_sts": 0.7922953172658802, |
|
"eval_sickr_spearman": 0.7435230833194328, |
|
"eval_stsb_spearman": 0.8410675512123275, |
|
"step": 21625 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_avg_sts": 0.7920827130593174, |
|
"eval_sickr_spearman": 0.7432143393993886, |
|
"eval_stsb_spearman": 0.8409510867192462, |
|
"step": 21750 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"eval_avg_sts": 0.7893982619162593, |
|
"eval_sickr_spearman": 0.7409595673734778, |
|
"eval_stsb_spearman": 0.8378369564590408, |
|
"step": 21875 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"learning_rate": 2.072315371816204e-06, |
|
"loss": 0.0002, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"eval_avg_sts": 0.7906089294600861, |
|
"eval_sickr_spearman": 0.7422200475685182, |
|
"eval_stsb_spearman": 0.838997811351654, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_avg_sts": 0.7914097742253603, |
|
"eval_sickr_spearman": 0.7423016043787602, |
|
"eval_stsb_spearman": 0.8405179440719603, |
|
"step": 22125 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_avg_sts": 0.791727396078017, |
|
"eval_sickr_spearman": 0.7433686633283093, |
|
"eval_stsb_spearman": 0.8400861288277247, |
|
"step": 22250 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"eval_avg_sts": 0.7914842385018235, |
|
"eval_sickr_spearman": 0.7423251876495663, |
|
"eval_stsb_spearman": 0.8406432893540806, |
|
"step": 22375 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"learning_rate": 1.9603225393574807e-06, |
|
"loss": 0.0001, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"eval_avg_sts": 0.7915202710875588, |
|
"eval_sickr_spearman": 0.7422767242682152, |
|
"eval_stsb_spearman": 0.8407638179069024, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"eval_avg_sts": 0.7918702583757414, |
|
"eval_sickr_spearman": 0.7429271614438903, |
|
"eval_stsb_spearman": 0.8408133553075926, |
|
"step": 22625 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"eval_avg_sts": 0.7916045718347005, |
|
"eval_sickr_spearman": 0.7425266300889978, |
|
"eval_stsb_spearman": 0.840682513580403, |
|
"step": 22750 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"eval_avg_sts": 0.7915999641875153, |
|
"eval_sickr_spearman": 0.7422474733274393, |
|
"eval_stsb_spearman": 0.8409524550475914, |
|
"step": 22875 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"learning_rate": 1.8483297068987584e-06, |
|
"loss": 0.0002, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 1.47, |
|
"eval_avg_sts": 0.792815682844469, |
|
"eval_sickr_spearman": 0.7426967562502915, |
|
"eval_stsb_spearman": 0.8429346094386464, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"eval_avg_sts": 0.7927916857497739, |
|
"eval_sickr_spearman": 0.7425698100491905, |
|
"eval_stsb_spearman": 0.8430135614503571, |
|
"step": 23125 |
|
}, |
|
{ |
|
"epoch": 1.49, |
|
"eval_avg_sts": 0.7928345271530053, |
|
"eval_sickr_spearman": 0.7425940177243154, |
|
"eval_stsb_spearman": 0.8430750365816952, |
|
"step": 23250 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_avg_sts": 0.7930442205998951, |
|
"eval_sickr_spearman": 0.7427970932211958, |
|
"eval_stsb_spearman": 0.8432913479785945, |
|
"step": 23375 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 1.7363368744400357e-06, |
|
"loss": 0.0, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_avg_sts": 0.793033132084566, |
|
"eval_sickr_spearman": 0.7428263441619716, |
|
"eval_stsb_spearman": 0.8432399200071605, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_avg_sts": 0.7929242651260953, |
|
"eval_sickr_spearman": 0.7427599171486827, |
|
"eval_stsb_spearman": 0.8430886131035079, |
|
"step": 23625 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"eval_avg_sts": 0.7936208486615127, |
|
"eval_sickr_spearman": 0.7430878254782006, |
|
"eval_stsb_spearman": 0.8441538718448248, |
|
"step": 23750 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"eval_avg_sts": 0.7935886289185006, |
|
"eval_sickr_spearman": 0.7430728878056534, |
|
"eval_stsb_spearman": 0.8441043700313476, |
|
"step": 23875 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"learning_rate": 1.6243440419813131e-06, |
|
"loss": 0.0001, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_avg_sts": 0.7935571381985222, |
|
"eval_sickr_spearman": 0.7430181323500139, |
|
"eval_stsb_spearman": 0.8440961440470305, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_avg_sts": 0.7935492855380204, |
|
"eval_sickr_spearman": 0.7430870569805776, |
|
"eval_stsb_spearman": 0.8440115140954632, |
|
"step": 24125 |
|
}, |
|
{ |
|
"epoch": 1.55, |
|
"eval_avg_sts": 0.7936128430055818, |
|
"eval_sickr_spearman": 0.7431491611947371, |
|
"eval_stsb_spearman": 0.8440765248164266, |
|
"step": 24250 |
|
}, |
|
{ |
|
"epoch": 1.56, |
|
"eval_avg_sts": 0.7936605492215507, |
|
"eval_sickr_spearman": 0.7432605933500736, |
|
"eval_stsb_spearman": 0.844060505093028, |
|
"step": 24375 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"learning_rate": 1.5123512095225906e-06, |
|
"loss": 0.0, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"eval_avg_sts": 0.793667841726459, |
|
"eval_sickr_spearman": 0.7432775483288812, |
|
"eval_stsb_spearman": 0.8440581351240368, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_avg_sts": 0.7948942597846932, |
|
"eval_sickr_spearman": 0.744056468700903, |
|
"eval_stsb_spearman": 0.8457320508684834, |
|
"step": 24625 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_avg_sts": 0.7948721522573494, |
|
"eval_sickr_spearman": 0.7440626647129885, |
|
"eval_stsb_spearman": 0.8456816398017104, |
|
"step": 24750 |
|
}, |
|
{ |
|
"epoch": 1.59, |
|
"eval_avg_sts": 0.7945095949089607, |
|
"eval_sickr_spearman": 0.7443504190417043, |
|
"eval_stsb_spearman": 0.8446687707762169, |
|
"step": 24875 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 1.4003583770638678e-06, |
|
"loss": 0.0001, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_avg_sts": 0.7947724077574231, |
|
"eval_sickr_spearman": 0.7446924004839437, |
|
"eval_stsb_spearman": 0.8448524150309025, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"eval_avg_sts": 0.7959915253602992, |
|
"eval_sickr_spearman": 0.7461332854959857, |
|
"eval_stsb_spearman": 0.8458497652246126, |
|
"step": 25125 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"eval_avg_sts": 0.7955281876289857, |
|
"eval_sickr_spearman": 0.7458754244134463, |
|
"eval_stsb_spearman": 0.845180950844525, |
|
"step": 25250 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"eval_avg_sts": 0.79543745522762, |
|
"eval_sickr_spearman": 0.7456630610129066, |
|
"eval_stsb_spearman": 0.8452118494423333, |
|
"step": 25375 |
|
}, |
|
{ |
|
"epoch": 1.63, |
|
"learning_rate": 1.2883655446051453e-06, |
|
"loss": 0.0001, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 1.63, |
|
"eval_avg_sts": 0.795353488562289, |
|
"eval_sickr_spearman": 0.7455269408714309, |
|
"eval_stsb_spearman": 0.8451800362531473, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"eval_avg_sts": 0.7953584932327289, |
|
"eval_sickr_spearman": 0.745271175256273, |
|
"eval_stsb_spearman": 0.8454458112091847, |
|
"step": 25625 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_avg_sts": 0.7953254322370598, |
|
"eval_sickr_spearman": 0.7452719917849974, |
|
"eval_stsb_spearman": 0.8453788726891222, |
|
"step": 25750 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"eval_avg_sts": 0.7952872018869009, |
|
"eval_sickr_spearman": 0.7452931735007315, |
|
"eval_stsb_spearman": 0.8452812302730703, |
|
"step": 25875 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"learning_rate": 1.1763727121464225e-06, |
|
"loss": 0.0001, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"eval_avg_sts": 0.7952607086010879, |
|
"eval_sickr_spearman": 0.7453110410704665, |
|
"eval_stsb_spearman": 0.8452103761317094, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"eval_avg_sts": 0.7950903508557705, |
|
"eval_sickr_spearman": 0.7449656494200251, |
|
"eval_stsb_spearman": 0.8452150522915161, |
|
"step": 26125 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"eval_avg_sts": 0.7950105822340711, |
|
"eval_sickr_spearman": 0.7448497023411534, |
|
"eval_stsb_spearman": 0.8451714621269887, |
|
"step": 26250 |
|
}, |
|
{ |
|
"epoch": 1.69, |
|
"eval_avg_sts": 0.7950131323560599, |
|
"eval_sickr_spearman": 0.744852055865124, |
|
"eval_stsb_spearman": 0.8451742088469958, |
|
"step": 26375 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"learning_rate": 1.0643798796877e-06, |
|
"loss": 0.0001, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"eval_avg_sts": 0.7950484138603111, |
|
"eval_sickr_spearman": 0.7455690161162907, |
|
"eval_stsb_spearman": 0.8445278116043317, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"eval_avg_sts": 0.7950041615346236, |
|
"eval_sickr_spearman": 0.7455438958502385, |
|
"eval_stsb_spearman": 0.8444644272190087, |
|
"step": 26625 |
|
}, |
|
{ |
|
"epoch": 1.71, |
|
"eval_avg_sts": 0.7946972455858132, |
|
"eval_sickr_spearman": 0.745472569664603, |
|
"eval_stsb_spearman": 0.8439219215070236, |
|
"step": 26750 |
|
}, |
|
{ |
|
"epoch": 1.72, |
|
"eval_avg_sts": 0.7944591743219949, |
|
"eval_sickr_spearman": 0.7454866427773243, |
|
"eval_stsb_spearman": 0.8434317058666653, |
|
"step": 26875 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"learning_rate": 9.523870472289774e-07, |
|
"loss": 0.0001, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"eval_avg_sts": 0.7944066177099748, |
|
"eval_sickr_spearman": 0.7454395722979149, |
|
"eval_stsb_spearman": 0.8433736631220347, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_avg_sts": 0.7944436945207991, |
|
"eval_sickr_spearman": 0.7455328006658063, |
|
"eval_stsb_spearman": 0.8433545883757919, |
|
"step": 27125 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_avg_sts": 0.7944797298738457, |
|
"eval_sickr_spearman": 0.7455790065853898, |
|
"eval_stsb_spearman": 0.8433804531623017, |
|
"step": 27250 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_avg_sts": 0.7944698737687554, |
|
"eval_sickr_spearman": 0.7455735310398258, |
|
"eval_stsb_spearman": 0.8433662164976851, |
|
"step": 27375 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 8.403942147702547e-07, |
|
"loss": 0.0001, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_avg_sts": 0.7942514496393891, |
|
"eval_sickr_spearman": 0.74535724699005, |
|
"eval_stsb_spearman": 0.8431456522887281, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 1.77, |
|
"eval_avg_sts": 0.7944530448391101, |
|
"eval_sickr_spearman": 0.7454611862935621, |
|
"eval_stsb_spearman": 0.8434449033846582, |
|
"step": 27625 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_avg_sts": 0.7944670140899726, |
|
"eval_sickr_spearman": 0.7455168063090274, |
|
"eval_stsb_spearman": 0.8434172218709176, |
|
"step": 27750 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_avg_sts": 0.7944968856863333, |
|
"eval_sickr_spearman": 0.7455487469914838, |
|
"eval_stsb_spearman": 0.8434450243811827, |
|
"step": 27875 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"learning_rate": 7.284013823115321e-07, |
|
"loss": 0.0001, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"eval_avg_sts": 0.7944813522912897, |
|
"eval_sickr_spearman": 0.7459449555472468, |
|
"eval_stsb_spearman": 0.8430177490353326, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_avg_sts": 0.7944717848510598, |
|
"eval_sickr_spearman": 0.7458816025244499, |
|
"eval_stsb_spearman": 0.8430619671776697, |
|
"step": 28125 |
|
}, |
|
{ |
|
"epoch": 1.81, |
|
"eval_avg_sts": 0.7943252967954475, |
|
"eval_sickr_spearman": 0.7455355384385883, |
|
"eval_stsb_spearman": 0.8431150551523066, |
|
"step": 28250 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_avg_sts": 0.7945802673668048, |
|
"eval_sickr_spearman": 0.7459384233174512, |
|
"eval_stsb_spearman": 0.8432221114161584, |
|
"step": 28375 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"learning_rate": 6.164085498528094e-07, |
|
"loss": 0.0001, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_avg_sts": 0.7945695711998493, |
|
"eval_sickr_spearman": 0.7459346288604376, |
|
"eval_stsb_spearman": 0.843204513539261, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_avg_sts": 0.7945396361578374, |
|
"eval_sickr_spearman": 0.7462354956798459, |
|
"eval_stsb_spearman": 0.8428437766358288, |
|
"step": 28625 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"eval_avg_sts": 0.7944409539151067, |
|
"eval_sickr_spearman": 0.7461240814315593, |
|
"eval_stsb_spearman": 0.8427578263986542, |
|
"step": 28750 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_avg_sts": 0.7940565976087757, |
|
"eval_sickr_spearman": 0.7457283833108623, |
|
"eval_stsb_spearman": 0.8423848119066891, |
|
"step": 28875 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"learning_rate": 5.044157173940868e-07, |
|
"loss": 0.0002, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_avg_sts": 0.7940545279108154, |
|
"eval_sickr_spearman": 0.7457486524356691, |
|
"eval_stsb_spearman": 0.8423604033859617, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_avg_sts": 0.7940541798236898, |
|
"eval_sickr_spearman": 0.7457327061099918, |
|
"eval_stsb_spearman": 0.8423756535373876, |
|
"step": 29125 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"eval_avg_sts": 0.794045870127827, |
|
"eval_sickr_spearman": 0.7457254534136746, |
|
"eval_stsb_spearman": 0.8423662868419793, |
|
"step": 29250 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_avg_sts": 0.7939439159521589, |
|
"eval_sickr_spearman": 0.7456850112262637, |
|
"eval_stsb_spearman": 0.8422028206780539, |
|
"step": 29375 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"learning_rate": 3.9242288493536413e-07, |
|
"loss": 0.0001, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"eval_avg_sts": 0.7938843170635432, |
|
"eval_sickr_spearman": 0.7456857797238867, |
|
"eval_stsb_spearman": 0.8420828544031996, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 1.9, |
|
"eval_avg_sts": 0.7938335370035037, |
|
"eval_sickr_spearman": 0.7456398619909119, |
|
"eval_stsb_spearman": 0.8420272120160953, |
|
"step": 29625 |
|
}, |
|
{ |
|
"epoch": 1.9, |
|
"eval_avg_sts": 0.7937791099281831, |
|
"eval_sickr_spearman": 0.7455667765481975, |
|
"eval_stsb_spearman": 0.8419914433081688, |
|
"step": 29750 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"eval_avg_sts": 0.7937599626397398, |
|
"eval_sickr_spearman": 0.7455335691634293, |
|
"eval_stsb_spearman": 0.8419863561160503, |
|
"step": 29875 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 2.804300524766415e-07, |
|
"loss": 0.0001, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"eval_avg_sts": 0.7937406443684292, |
|
"eval_sickr_spearman": 0.7454874593060488, |
|
"eval_stsb_spearman": 0.8419938294308097, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.93, |
|
"eval_avg_sts": 0.7939020781683644, |
|
"eval_sickr_spearman": 0.7457190652771832, |
|
"eval_stsb_spearman": 0.8420850910595457, |
|
"step": 30125 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_avg_sts": 0.7938812791358627, |
|
"eval_sickr_spearman": 0.7456977394681448, |
|
"eval_stsb_spearman": 0.8420648188035805, |
|
"step": 30250 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_avg_sts": 0.7937378630658074, |
|
"eval_sickr_spearman": 0.7454741066598489, |
|
"eval_stsb_spearman": 0.842001619471766, |
|
"step": 30375 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 1.6843722001791884e-07, |
|
"loss": 0.0002, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"eval_avg_sts": 0.7937467005092009, |
|
"eval_sickr_spearman": 0.7454940875980473, |
|
"eval_stsb_spearman": 0.8419993134203545, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"eval_avg_sts": 0.7937544654414969, |
|
"eval_sickr_spearman": 0.7454804467652388, |
|
"eval_stsb_spearman": 0.8420284841177549, |
|
"step": 30625 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"eval_avg_sts": 0.7937753802718709, |
|
"eval_sickr_spearman": 0.7455158937181001, |
|
"eval_stsb_spearman": 0.8420348668256417, |
|
"step": 30750 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_avg_sts": 0.7937608907538469, |
|
"eval_sickr_spearman": 0.745488035679266, |
|
"eval_stsb_spearman": 0.8420337458284277, |
|
"step": 30875 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 5.64443875591962e-08, |
|
"loss": 0.0001, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_avg_sts": 0.7937471629995045, |
|
"eval_sickr_spearman": 0.7454658933415031, |
|
"eval_stsb_spearman": 0.8420284326575058, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 1.99, |
|
"eval_avg_sts": 0.7937690011247767, |
|
"eval_sickr_spearman": 0.7455096977060146, |
|
"eval_stsb_spearman": 0.8420283045435387, |
|
"step": 31125 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_avg_sts": 0.7937804647459197, |
|
"eval_sickr_spearman": 0.7455530217595118, |
|
"eval_stsb_spearman": 0.8420079077323277, |
|
"step": 31250 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 31252, |
|
"train_runtime": 9641.8618, |
|
"train_samples_per_second": 3.241 |
|
} |
|
], |
|
"max_steps": 31252, |
|
"num_train_epochs": 2, |
|
"total_flos": 333421219511531712, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|