{ "best_metric": 0.8548645464866416, "best_model_checkpoint": "result/InfoCSE-bert-base", "epoch": 2.0, "global_step": 31252, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "eval_avg_sts": 0.645032772395593, "eval_sickr_spearman": 0.6463705264094609, "eval_stsb_spearman": 0.643695018381725, "step": 125 }, { "epoch": 0.02, "eval_avg_sts": 0.685240727331801, "eval_sickr_spearman": 0.669725073110526, "eval_stsb_spearman": 0.700756381553076, "step": 250 }, { "epoch": 0.02, "eval_avg_sts": 0.7027556246143734, "eval_sickr_spearman": 0.6818145493736003, "eval_stsb_spearman": 0.7236966998551464, "step": 375 }, { "epoch": 0.03, "learning_rate": 6.888007167541277e-06, "loss": 0.0008, "step": 500 }, { "epoch": 0.03, "eval_avg_sts": 0.7085517582757557, "eval_sickr_spearman": 0.6868034438177743, "eval_stsb_spearman": 0.730300072733737, "step": 500 }, { "epoch": 0.04, "eval_avg_sts": 0.7152446421256347, "eval_sickr_spearman": 0.6908805158322469, "eval_stsb_spearman": 0.7396087684190223, "step": 625 }, { "epoch": 0.05, "eval_avg_sts": 0.744333698385975, "eval_sickr_spearman": 0.7107611650906991, "eval_stsb_spearman": 0.7779062316812507, "step": 750 }, { "epoch": 0.06, "eval_avg_sts": 0.749906268768782, "eval_sickr_spearman": 0.7164115438638786, "eval_stsb_spearman": 0.7834009936736853, "step": 875 }, { "epoch": 0.06, "learning_rate": 6.776014335082554e-06, "loss": 0.0003, "step": 1000 }, { "epoch": 0.06, "eval_avg_sts": 0.7527465185576756, "eval_sickr_spearman": 0.7194187230938174, "eval_stsb_spearman": 0.7860743140215339, "step": 1000 }, { "epoch": 0.07, "eval_avg_sts": 0.7563795190354858, "eval_sickr_spearman": 0.7197145466475747, "eval_stsb_spearman": 0.793044491423397, "step": 1125 }, { "epoch": 0.08, "eval_avg_sts": 0.7577088125126856, "eval_sickr_spearman": 0.7209790134240346, "eval_stsb_spearman": 0.7944386116013368, "step": 1250 }, { "epoch": 0.09, "eval_avg_sts": 0.7618327362445115, "eval_sickr_spearman": 0.7205304029366025, "eval_stsb_spearman": 0.8031350695524205, "step": 1375 }, { "epoch": 0.1, "learning_rate": 6.6640215026238325e-06, "loss": 0.0004, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7526454517508075, "eval_sickr_spearman": 0.7131317881332785, "eval_stsb_spearman": 0.7921591153683366, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7584465941723788, "eval_sickr_spearman": 0.7183862465373038, "eval_stsb_spearman": 0.798506941807454, "step": 1625 }, { "epoch": 0.11, "eval_avg_sts": 0.7600830398569421, "eval_sickr_spearman": 0.7199089285150947, "eval_stsb_spearman": 0.8002571511987896, "step": 1750 }, { "epoch": 0.12, "eval_avg_sts": 0.753643480678329, "eval_sickr_spearman": 0.7154178764373269, "eval_stsb_spearman": 0.7918690849193311, "step": 1875 }, { "epoch": 0.13, "learning_rate": 6.55202867016511e-06, "loss": 0.0002, "step": 2000 }, { "epoch": 0.13, "eval_avg_sts": 0.7563852037282979, "eval_sickr_spearman": 0.7193429780468495, "eval_stsb_spearman": 0.7934274294097461, "step": 2000 }, { "epoch": 0.14, "eval_avg_sts": 0.7664707372188553, "eval_sickr_spearman": 0.7240147231282276, "eval_stsb_spearman": 0.8089267513094829, "step": 2125 }, { "epoch": 0.14, "eval_avg_sts": 0.7706419135337745, "eval_sickr_spearman": 0.7288192261739805, "eval_stsb_spearman": 0.8124646008935686, "step": 2250 }, { "epoch": 0.15, "eval_avg_sts": 0.7712663844837009, "eval_sickr_spearman": 0.7299219242007967, "eval_stsb_spearman": 0.8126108447666052, "step": 2375 }, { "epoch": 0.16, "learning_rate": 6.440035837706387e-06, "loss": 0.0002, "step": 2500 }, { "epoch": 0.16, "eval_avg_sts": 0.7728606127631258, "eval_sickr_spearman": 0.7312590620337324, "eval_stsb_spearman": 0.8144621634925192, "step": 2500 }, { "epoch": 0.17, "eval_avg_sts": 0.7729813550763709, "eval_sickr_spearman": 0.7313422519014231, "eval_stsb_spearman": 0.8146204582513188, "step": 2625 }, { "epoch": 0.18, "eval_avg_sts": 0.7754932728462534, "eval_sickr_spearman": 0.7312568526030662, "eval_stsb_spearman": 0.8197296930894405, "step": 2750 }, { "epoch": 0.18, "eval_avg_sts": 0.7712885427125948, "eval_sickr_spearman": 0.7266254056157947, "eval_stsb_spearman": 0.8159516798093949, "step": 2875 }, { "epoch": 0.19, "learning_rate": 6.328043005247664e-06, "loss": 0.0002, "step": 3000 }, { "epoch": 0.19, "eval_avg_sts": 0.7716849957034901, "eval_sickr_spearman": 0.7262548936993011, "eval_stsb_spearman": 0.8171150977076791, "step": 3000 }, { "epoch": 0.2, "eval_avg_sts": 0.7711561198226983, "eval_sickr_spearman": 0.7262503241591916, "eval_stsb_spearman": 0.816061915486205, "step": 3125 }, { "epoch": 0.21, "eval_avg_sts": 0.7783568816799603, "eval_sickr_spearman": 0.7303159233258935, "eval_stsb_spearman": 0.8263978400340272, "step": 3250 }, { "epoch": 0.22, "eval_avg_sts": 0.7809228297940308, "eval_sickr_spearman": 0.7337628272894983, "eval_stsb_spearman": 0.8280828322985634, "step": 3375 }, { "epoch": 0.22, "learning_rate": 6.2160501727889415e-06, "loss": 0.0001, "step": 3500 }, { "epoch": 0.22, "eval_avg_sts": 0.7797812899347809, "eval_sickr_spearman": 0.7324181485736369, "eval_stsb_spearman": 0.8271444312959251, "step": 3500 }, { "epoch": 0.23, "eval_avg_sts": 0.780044187865891, "eval_sickr_spearman": 0.7338939041653229, "eval_stsb_spearman": 0.8261944715664592, "step": 3625 }, { "epoch": 0.24, "eval_avg_sts": 0.7787673562775448, "eval_sickr_spearman": 0.7328702653314738, "eval_stsb_spearman": 0.8246644472236156, "step": 3750 }, { "epoch": 0.25, "eval_avg_sts": 0.779541327716536, "eval_sickr_spearman": 0.7329598913667574, "eval_stsb_spearman": 0.8261227640663145, "step": 3875 }, { "epoch": 0.26, "learning_rate": 6.104057340330219e-06, "loss": 0.0003, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.7747719384340315, "eval_sickr_spearman": 0.7285930957484098, "eval_stsb_spearman": 0.8209507811196531, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.7765396311685044, "eval_sickr_spearman": 0.7301922912707919, "eval_stsb_spearman": 0.8228869710662171, "step": 4125 }, { "epoch": 0.27, "eval_avg_sts": 0.7728155845030844, "eval_sickr_spearman": 0.7257823156922516, "eval_stsb_spearman": 0.8198488533139171, "step": 4250 }, { "epoch": 0.28, "eval_avg_sts": 0.7734186821765212, "eval_sickr_spearman": 0.7266760303967105, "eval_stsb_spearman": 0.8201613339563318, "step": 4375 }, { "epoch": 0.29, "learning_rate": 5.992064507871497e-06, "loss": 0.0004, "step": 4500 }, { "epoch": 0.29, "eval_avg_sts": 0.7731296739509669, "eval_sickr_spearman": 0.7214541370794603, "eval_stsb_spearman": 0.8248052108224735, "step": 4500 }, { "epoch": 0.3, "eval_avg_sts": 0.7728203601265164, "eval_sickr_spearman": 0.7219969845879138, "eval_stsb_spearman": 0.8236437356651191, "step": 4625 }, { "epoch": 0.3, "eval_avg_sts": 0.773140320693449, "eval_sickr_spearman": 0.7226297943493609, "eval_stsb_spearman": 0.823650847037537, "step": 4750 }, { "epoch": 0.31, "eval_avg_sts": 0.7776841987101548, "eval_sickr_spearman": 0.7260857761911376, "eval_stsb_spearman": 0.8292826212291721, "step": 4875 }, { "epoch": 0.32, "learning_rate": 5.880071675412773e-06, "loss": 0.0001, "step": 5000 }, { "epoch": 0.32, "eval_avg_sts": 0.7787697170418183, "eval_sickr_spearman": 0.7268813633553585, "eval_stsb_spearman": 0.8306580707282781, "step": 5000 }, { "epoch": 0.33, "eval_avg_sts": 0.7794054673251014, "eval_sickr_spearman": 0.727022190544775, "eval_stsb_spearman": 0.8317887441054277, "step": 5125 }, { "epoch": 0.34, "eval_avg_sts": 0.7794784586068343, "eval_sickr_spearman": 0.7302013691489637, "eval_stsb_spearman": 0.8287555480647049, "step": 5250 }, { "epoch": 0.34, "eval_avg_sts": 0.7771717407788259, "eval_sickr_spearman": 0.7244288472848269, "eval_stsb_spearman": 0.829914634272825, "step": 5375 }, { "epoch": 0.35, "learning_rate": 5.7680788429540505e-06, "loss": 0.0003, "step": 5500 }, { "epoch": 0.35, "eval_avg_sts": 0.778478777290903, "eval_sickr_spearman": 0.7256252059594475, "eval_stsb_spearman": 0.8313323486223586, "step": 5500 }, { "epoch": 0.36, "eval_avg_sts": 0.7793214110914728, "eval_sickr_spearman": 0.726303453142855, "eval_stsb_spearman": 0.8323393690400904, "step": 5625 }, { "epoch": 0.37, "eval_avg_sts": 0.7791715295390024, "eval_sickr_spearman": 0.7257507592586067, "eval_stsb_spearman": 0.8325922998193981, "step": 5750 }, { "epoch": 0.38, "eval_avg_sts": 0.7800081020871235, "eval_sickr_spearman": 0.726603503433539, "eval_stsb_spearman": 0.8334127007407081, "step": 5875 }, { "epoch": 0.38, "learning_rate": 5.656086010495328e-06, "loss": 0.0001, "step": 6000 }, { "epoch": 0.38, "eval_avg_sts": 0.7802662913925068, "eval_sickr_spearman": 0.7272382344390437, "eval_stsb_spearman": 0.8332943483459699, "step": 6000 }, { "epoch": 0.39, "eval_avg_sts": 0.7788831909074992, "eval_sickr_spearman": 0.7254892779423776, "eval_stsb_spearman": 0.8322771038726209, "step": 6125 }, { "epoch": 0.4, "eval_avg_sts": 0.7790896526834474, "eval_sickr_spearman": 0.7246235173389557, "eval_stsb_spearman": 0.8335557880279391, "step": 6250 }, { "epoch": 0.41, "eval_avg_sts": 0.7811606337604482, "eval_sickr_spearman": 0.7249414832304759, "eval_stsb_spearman": 0.8373797842904204, "step": 6375 }, { "epoch": 0.42, "learning_rate": 5.544093178036605e-06, "loss": 0.0001, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.7814213566702608, "eval_sickr_spearman": 0.7254279422258411, "eval_stsb_spearman": 0.8374147711146805, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.7818500804137162, "eval_sickr_spearman": 0.726220023119657, "eval_stsb_spearman": 0.8374801377077753, "step": 6625 }, { "epoch": 0.43, "eval_avg_sts": 0.7832040571269738, "eval_sickr_spearman": 0.7301835015792287, "eval_stsb_spearman": 0.8362246126747188, "step": 6750 }, { "epoch": 0.44, "eval_avg_sts": 0.7841900708722672, "eval_sickr_spearman": 0.731056755034475, "eval_stsb_spearman": 0.8373233867100595, "step": 6875 }, { "epoch": 0.45, "learning_rate": 5.432100345577883e-06, "loss": 0.0001, "step": 7000 }, { "epoch": 0.45, "eval_avg_sts": 0.7862472754964975, "eval_sickr_spearman": 0.7333967342343369, "eval_stsb_spearman": 0.839097816758658, "step": 7000 }, { "epoch": 0.46, "eval_avg_sts": 0.7859634761320248, "eval_sickr_spearman": 0.7330241089493801, "eval_stsb_spearman": 0.8389028433146695, "step": 7125 }, { "epoch": 0.46, "eval_avg_sts": 0.7821803440191185, "eval_sickr_spearman": 0.7303841755210372, "eval_stsb_spearman": 0.8339765125171998, "step": 7250 }, { "epoch": 0.47, "eval_avg_sts": 0.7825744125697178, "eval_sickr_spearman": 0.7306357624303699, "eval_stsb_spearman": 0.8345130627090659, "step": 7375 }, { "epoch": 0.48, "learning_rate": 5.32010751311916e-06, "loss": 0.0001, "step": 7500 }, { "epoch": 0.48, "eval_avg_sts": 0.78116110534451, "eval_sickr_spearman": 0.7276775268927966, "eval_stsb_spearman": 0.8346446837962234, "step": 7500 }, { "epoch": 0.49, "eval_avg_sts": 0.7799908773501631, "eval_sickr_spearman": 0.7237501678215064, "eval_stsb_spearman": 0.83623158687882, "step": 7625 }, { "epoch": 0.5, "eval_avg_sts": 0.780269211830304, "eval_sickr_spearman": 0.7244608359983847, "eval_stsb_spearman": 0.8360775876622232, "step": 7750 }, { "epoch": 0.5, "eval_avg_sts": 0.7807594418954099, "eval_sickr_spearman": 0.7247573319875622, "eval_stsb_spearman": 0.8367615518032576, "step": 7875 }, { "epoch": 0.51, "learning_rate": 5.2081146806604376e-06, "loss": 0.0001, "step": 8000 }, { "epoch": 0.51, "eval_avg_sts": 0.7809657512161441, "eval_sickr_spearman": 0.7257775125821077, "eval_stsb_spearman": 0.8361539898501805, "step": 8000 }, { "epoch": 0.52, "eval_avg_sts": 0.7808305047079998, "eval_sickr_spearman": 0.7258256397457487, "eval_stsb_spearman": 0.8358353696702507, "step": 8125 }, { "epoch": 0.53, "eval_avg_sts": 0.7808244974473546, "eval_sickr_spearman": 0.7260765061885599, "eval_stsb_spearman": 0.8355724887061494, "step": 8250 }, { "epoch": 0.54, "eval_avg_sts": 0.7807531331871759, "eval_sickr_spearman": 0.725998455648723, "eval_stsb_spearman": 0.8355078107256287, "step": 8375 }, { "epoch": 0.54, "learning_rate": 5.096121848201715e-06, "loss": 0.0001, "step": 8500 }, { "epoch": 0.54, "eval_avg_sts": 0.7805553727181309, "eval_sickr_spearman": 0.7259074847425994, "eval_stsb_spearman": 0.8352032606936624, "step": 8500 }, { "epoch": 0.55, "eval_avg_sts": 0.7840901636781107, "eval_sickr_spearman": 0.727197936344937, "eval_stsb_spearman": 0.8409823910112844, "step": 8625 }, { "epoch": 0.56, "eval_avg_sts": 0.7841336470257416, "eval_sickr_spearman": 0.7241774524998998, "eval_stsb_spearman": 0.8440898415515834, "step": 8750 }, { "epoch": 0.57, "eval_avg_sts": 0.7848770188208263, "eval_sickr_spearman": 0.7246812987539857, "eval_stsb_spearman": 0.8450727388876668, "step": 8875 }, { "epoch": 0.58, "learning_rate": 4.984129015742992e-06, "loss": 0.0001, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7851602291221325, "eval_sickr_spearman": 0.7257603654788943, "eval_stsb_spearman": 0.8445600927653706, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7881113225894085, "eval_sickr_spearman": 0.7297208179790754, "eval_stsb_spearman": 0.8465018271997418, "step": 9125 }, { "epoch": 0.59, "eval_avg_sts": 0.7883865180777926, "eval_sickr_spearman": 0.7305029084037921, "eval_stsb_spearman": 0.8462701277517931, "step": 9250 }, { "epoch": 0.6, "eval_avg_sts": 0.7905936766250409, "eval_sickr_spearman": 0.7318727073857056, "eval_stsb_spearman": 0.8493146458643761, "step": 9375 }, { "epoch": 0.61, "learning_rate": 4.872136183284269e-06, "loss": 0.0002, "step": 9500 }, { "epoch": 0.61, "eval_avg_sts": 0.7894195399749903, "eval_sickr_spearman": 0.7297918559781024, "eval_stsb_spearman": 0.8490472239718782, "step": 9500 }, { "epoch": 0.62, "eval_avg_sts": 0.7888302258840285, "eval_sickr_spearman": 0.7290175946229199, "eval_stsb_spearman": 0.848642857145137, "step": 9625 }, { "epoch": 0.62, "eval_avg_sts": 0.7898168606884958, "eval_sickr_spearman": 0.7311126152054476, "eval_stsb_spearman": 0.848521106171544, "step": 9750 }, { "epoch": 0.63, "eval_avg_sts": 0.7916780015304804, "eval_sickr_spearman": 0.7336695508905056, "eval_stsb_spearman": 0.8496864521704552, "step": 9875 }, { "epoch": 0.64, "learning_rate": 4.760143350825547e-06, "loss": 0.0001, "step": 10000 }, { "epoch": 0.64, "eval_avg_sts": 0.7916349913886156, "eval_sickr_spearman": 0.7339293030870828, "eval_stsb_spearman": 0.8493406796901484, "step": 10000 }, { "epoch": 0.65, "eval_avg_sts": 0.791507759549186, "eval_sickr_spearman": 0.7339989962152694, "eval_stsb_spearman": 0.8490165228831026, "step": 10125 }, { "epoch": 0.66, "eval_avg_sts": 0.789931989918206, "eval_sickr_spearman": 0.7311775052234905, "eval_stsb_spearman": 0.8486864746129216, "step": 10250 }, { "epoch": 0.66, "eval_avg_sts": 0.7899616736779131, "eval_sickr_spearman": 0.7317643492208613, "eval_stsb_spearman": 0.8481589981349649, "step": 10375 }, { "epoch": 0.67, "learning_rate": 4.648150518366825e-06, "loss": 0.0001, "step": 10500 }, { "epoch": 0.67, "eval_avg_sts": 0.7926863693434811, "eval_sickr_spearman": 0.7347004424206716, "eval_stsb_spearman": 0.8506722962662906, "step": 10500 }, { "epoch": 0.68, "eval_avg_sts": 0.7925310701894714, "eval_sickr_spearman": 0.7345030826248625, "eval_stsb_spearman": 0.8505590577540805, "step": 10625 }, { "epoch": 0.69, "eval_avg_sts": 0.7921847237714013, "eval_sickr_spearman": 0.734286503995874, "eval_stsb_spearman": 0.8500829435469286, "step": 10750 }, { "epoch": 0.7, "eval_avg_sts": 0.792045037000692, "eval_sickr_spearman": 0.7345833425953655, "eval_stsb_spearman": 0.8495067314060183, "step": 10875 }, { "epoch": 0.7, "learning_rate": 4.536157685908102e-06, "loss": 0.0001, "step": 11000 }, { "epoch": 0.7, "eval_avg_sts": 0.7924996456713199, "eval_sickr_spearman": 0.7354074602338407, "eval_stsb_spearman": 0.8495918311087991, "step": 11000 }, { "epoch": 0.71, "eval_avg_sts": 0.7924266596358673, "eval_sickr_spearman": 0.7356516503535521, "eval_stsb_spearman": 0.8492016689181826, "step": 11125 }, { "epoch": 0.72, "eval_avg_sts": 0.7926706111519558, "eval_sickr_spearman": 0.7358917097985398, "eval_stsb_spearman": 0.8494495125053718, "step": 11250 }, { "epoch": 0.73, "eval_avg_sts": 0.7930288164708986, "eval_sickr_spearman": 0.7354914185991545, "eval_stsb_spearman": 0.8505662143426428, "step": 11375 }, { "epoch": 0.74, "learning_rate": 4.424164853449379e-06, "loss": 0.0002, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.7926251189281965, "eval_sickr_spearman": 0.7351442017668584, "eval_stsb_spearman": 0.8501060360895348, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.7932695687388167, "eval_sickr_spearman": 0.7365684199867013, "eval_stsb_spearman": 0.8499707174909322, "step": 11625 }, { "epoch": 0.75, "eval_avg_sts": 0.7935921856407616, "eval_sickr_spearman": 0.7367729844477262, "eval_stsb_spearman": 0.850411386833797, "step": 11750 }, { "epoch": 0.76, "eval_avg_sts": 0.794782209944985, "eval_sickr_spearman": 0.7389587838119719, "eval_stsb_spearman": 0.8506056360779983, "step": 11875 }, { "epoch": 0.77, "learning_rate": 4.312172020990656e-06, "loss": 0.0002, "step": 12000 }, { "epoch": 0.77, "eval_avg_sts": 0.7971707208949131, "eval_sickr_spearman": 0.7394768953031847, "eval_stsb_spearman": 0.8548645464866416, "step": 12000 }, { "epoch": 0.78, "eval_avg_sts": 0.797638118412404, "eval_sickr_spearman": 0.7421029957743136, "eval_stsb_spearman": 0.8531732410504944, "step": 12125 }, { "epoch": 0.78, "eval_avg_sts": 0.7969091025343611, "eval_sickr_spearman": 0.741429359576644, "eval_stsb_spearman": 0.8523888454920783, "step": 12250 }, { "epoch": 0.79, "eval_avg_sts": 0.7919648350492454, "eval_sickr_spearman": 0.7347034683800623, "eval_stsb_spearman": 0.8492262017184287, "step": 12375 }, { "epoch": 0.8, "learning_rate": 4.2001791885319345e-06, "loss": 0.0005, "step": 12500 }, { "epoch": 0.8, "eval_avg_sts": 0.7921636059370547, "eval_sickr_spearman": 0.7353516480939697, "eval_stsb_spearman": 0.8489755637801396, "step": 12500 }, { "epoch": 0.81, "eval_avg_sts": 0.7924202367929077, "eval_sickr_spearman": 0.736975675695795, "eval_stsb_spearman": 0.8478647978900204, "step": 12625 }, { "epoch": 0.82, "eval_avg_sts": 0.7890475112371416, "eval_sickr_spearman": 0.7355575093947334, "eval_stsb_spearman": 0.8425375130795496, "step": 12750 }, { "epoch": 0.82, "eval_avg_sts": 0.7892144058224184, "eval_sickr_spearman": 0.7356575101479275, "eval_stsb_spearman": 0.8427713014969095, "step": 12875 }, { "epoch": 0.83, "learning_rate": 4.088186356073212e-06, "loss": 0.0002, "step": 13000 }, { "epoch": 0.83, "eval_avg_sts": 0.7908518455947956, "eval_sickr_spearman": 0.73698621219475, "eval_stsb_spearman": 0.8447174789948412, "step": 13000 }, { "epoch": 0.84, "eval_avg_sts": 0.7910358332545967, "eval_sickr_spearman": 0.7372511340625426, "eval_stsb_spearman": 0.8448205324466508, "step": 13125 }, { "epoch": 0.85, "eval_avg_sts": 0.7910819619646265, "eval_sickr_spearman": 0.7366442130647706, "eval_stsb_spearman": 0.8455197108644826, "step": 13250 }, { "epoch": 0.86, "eval_avg_sts": 0.7913313391681369, "eval_sickr_spearman": 0.7369983463756739, "eval_stsb_spearman": 0.8456643319606, "step": 13375 }, { "epoch": 0.86, "learning_rate": 3.976193523614489e-06, "loss": 0.0002, "step": 13500 }, { "epoch": 0.86, "eval_avg_sts": 0.7912515138401426, "eval_sickr_spearman": 0.7371570411348254, "eval_stsb_spearman": 0.8453459865454599, "step": 13500 }, { "epoch": 0.87, "eval_avg_sts": 0.7912798783058242, "eval_sickr_spearman": 0.7375416261640404, "eval_stsb_spearman": 0.8450181304476081, "step": 13625 }, { "epoch": 0.88, "eval_avg_sts": 0.7915843291718891, "eval_sickr_spearman": 0.7376919154804402, "eval_stsb_spearman": 0.845476742863338, "step": 13750 }, { "epoch": 0.89, "eval_avg_sts": 0.7917255539871094, "eval_sickr_spearman": 0.7381062797925467, "eval_stsb_spearman": 0.8453448281816721, "step": 13875 }, { "epoch": 0.9, "learning_rate": 3.864200691155766e-06, "loss": 0.0001, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.7916416194141285, "eval_sickr_spearman": 0.7380577683800943, "eval_stsb_spearman": 0.8452254704481627, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.7924269371428458, "eval_sickr_spearman": 0.738714977941072, "eval_stsb_spearman": 0.8461388963446196, "step": 14125 }, { "epoch": 0.91, "eval_avg_sts": 0.7923356777507629, "eval_sickr_spearman": 0.7386597902055195, "eval_stsb_spearman": 0.8460115652960062, "step": 14250 }, { "epoch": 0.92, "eval_avg_sts": 0.7922805942330418, "eval_sickr_spearman": 0.7387613759850612, "eval_stsb_spearman": 0.8457998124810223, "step": 14375 }, { "epoch": 0.93, "learning_rate": 3.7522078586970435e-06, "loss": 0.0001, "step": 14500 }, { "epoch": 0.93, "eval_avg_sts": 0.7934966210957259, "eval_sickr_spearman": 0.7397510568301936, "eval_stsb_spearman": 0.8472421853612582, "step": 14500 }, { "epoch": 0.94, "eval_avg_sts": 0.7930449265696451, "eval_sickr_spearman": 0.7393639741837038, "eval_stsb_spearman": 0.8467258789555864, "step": 14625 }, { "epoch": 0.94, "eval_avg_sts": 0.7924737714972381, "eval_sickr_spearman": 0.7393996612920722, "eval_stsb_spearman": 0.845547881702404, "step": 14750 }, { "epoch": 0.95, "eval_avg_sts": 0.792308440851152, "eval_sickr_spearman": 0.739175211955052, "eval_stsb_spearman": 0.845441669747252, "step": 14875 }, { "epoch": 0.96, "learning_rate": 3.6402150262383203e-06, "loss": 0.0001, "step": 15000 }, { "epoch": 0.96, "eval_avg_sts": 0.7932488441451628, "eval_sickr_spearman": 0.7404715713828667, "eval_stsb_spearman": 0.8460261169074589, "step": 15000 }, { "epoch": 0.97, "eval_avg_sts": 0.7931158785146848, "eval_sickr_spearman": 0.7406130710077032, "eval_stsb_spearman": 0.8456186860216665, "step": 15125 }, { "epoch": 0.98, "eval_avg_sts": 0.7945903311020877, "eval_sickr_spearman": 0.7431428210893474, "eval_stsb_spearman": 0.8460378411148278, "step": 15250 }, { "epoch": 0.98, "eval_avg_sts": 0.7948596387785098, "eval_sickr_spearman": 0.7440196288461001, "eval_stsb_spearman": 0.8456996487109196, "step": 15375 }, { "epoch": 0.99, "learning_rate": 3.5282221937795976e-06, "loss": 0.0002, "step": 15500 }, { "epoch": 0.99, "eval_avg_sts": 0.7948372805541641, "eval_sickr_spearman": 0.744097679385937, "eval_stsb_spearman": 0.8455768817223914, "step": 15500 }, { "epoch": 1.0, "eval_avg_sts": 0.7937246352478757, "eval_sickr_spearman": 0.7439027691763012, "eval_stsb_spearman": 0.8435465013194503, "step": 15625 }, { "epoch": 1.01, "eval_avg_sts": 0.7937099307469273, "eval_sickr_spearman": 0.7440485435691657, "eval_stsb_spearman": 0.8433713179246888, "step": 15750 }, { "epoch": 1.02, "eval_avg_sts": 0.7935877720189825, "eval_sickr_spearman": 0.7440728953375949, "eval_stsb_spearman": 0.84310264870037, "step": 15875 }, { "epoch": 1.02, "learning_rate": 3.4162293613208757e-06, "loss": 0.0001, "step": 16000 }, { "epoch": 1.02, "eval_avg_sts": 0.7935863758797379, "eval_sickr_spearman": 0.744390621073608, "eval_stsb_spearman": 0.8427821306858677, "step": 16000 }, { "epoch": 1.03, "eval_avg_sts": 0.7937197747425322, "eval_sickr_spearman": 0.7444404293257993, "eval_stsb_spearman": 0.8429991201592651, "step": 16125 }, { "epoch": 1.04, "eval_avg_sts": 0.7924446512199308, "eval_sickr_spearman": 0.7440353830473717, "eval_stsb_spearman": 0.8408539193924898, "step": 16250 }, { "epoch": 1.05, "eval_avg_sts": 0.7905555822474897, "eval_sickr_spearman": 0.7383070017654566, "eval_stsb_spearman": 0.8428041627295226, "step": 16375 }, { "epoch": 1.06, "learning_rate": 3.304236528862153e-06, "loss": 0.0001, "step": 16500 }, { "epoch": 1.06, "eval_avg_sts": 0.7899406430528368, "eval_sickr_spearman": 0.737816219970962, "eval_stsb_spearman": 0.8420650661347118, "step": 16500 }, { "epoch": 1.06, "eval_avg_sts": 0.7921524290697161, "eval_sickr_spearman": 0.7417105816755641, "eval_stsb_spearman": 0.842594276463868, "step": 16625 }, { "epoch": 1.07, "eval_avg_sts": 0.7909061020892134, "eval_sickr_spearman": 0.7410022670226564, "eval_stsb_spearman": 0.8408099371557706, "step": 16750 }, { "epoch": 1.08, "eval_avg_sts": 0.7911860344103485, "eval_sickr_spearman": 0.7404902554813262, "eval_stsb_spearman": 0.841881813339371, "step": 16875 }, { "epoch": 1.09, "learning_rate": 3.19224369640343e-06, "loss": 0.0002, "step": 17000 }, { "epoch": 1.09, "eval_avg_sts": 0.7912332320403954, "eval_sickr_spearman": 0.7405556258103834, "eval_stsb_spearman": 0.8419108382704075, "step": 17000 }, { "epoch": 1.1, "eval_avg_sts": 0.791745368257589, "eval_sickr_spearman": 0.7407413620796446, "eval_stsb_spearman": 0.8427493744355335, "step": 17125 }, { "epoch": 1.1, "eval_avg_sts": 0.7936116457907827, "eval_sickr_spearman": 0.7417212926111849, "eval_stsb_spearman": 0.8455019989703806, "step": 17250 }, { "epoch": 1.11, "eval_avg_sts": 0.7936037695250758, "eval_sickr_spearman": 0.7418167304097425, "eval_stsb_spearman": 0.8453908086404092, "step": 17375 }, { "epoch": 1.12, "learning_rate": 3.0802508639447074e-06, "loss": 0.0002, "step": 17500 }, { "epoch": 1.12, "eval_avg_sts": 0.792413452164604, "eval_sickr_spearman": 0.7425937295377067, "eval_stsb_spearman": 0.8422331747915013, "step": 17500 }, { "epoch": 1.13, "eval_avg_sts": 0.7927184217670188, "eval_sickr_spearman": 0.7428243748868126, "eval_stsb_spearman": 0.8426124686472249, "step": 17625 }, { "epoch": 1.14, "eval_avg_sts": 0.7926960182448954, "eval_sickr_spearman": 0.742725526880053, "eval_stsb_spearman": 0.842666509609738, "step": 17750 }, { "epoch": 1.14, "eval_avg_sts": 0.7927521207425385, "eval_sickr_spearman": 0.7428051144151359, "eval_stsb_spearman": 0.8426991270699412, "step": 17875 }, { "epoch": 1.15, "learning_rate": 2.9682580314859847e-06, "loss": 0.0, "step": 18000 }, { "epoch": 1.15, "eval_avg_sts": 0.7928433137943678, "eval_sickr_spearman": 0.7426588116801555, "eval_stsb_spearman": 0.8430278159085801, "step": 18000 }, { "epoch": 1.16, "eval_avg_sts": 0.792833492411573, "eval_sickr_spearman": 0.7426310977346257, "eval_stsb_spearman": 0.8430358870885203, "step": 18125 }, { "epoch": 1.17, "eval_avg_sts": 0.7928841848486375, "eval_sickr_spearman": 0.742908285221025, "eval_stsb_spearman": 0.84286008447625, "step": 18250 }, { "epoch": 1.18, "eval_avg_sts": 0.7925150543842555, "eval_sickr_spearman": 0.743895084200071, "eval_stsb_spearman": 0.84113502456844, "step": 18375 }, { "epoch": 1.18, "learning_rate": 2.8562651990272623e-06, "loss": 0.0001, "step": 18500 }, { "epoch": 1.18, "eval_avg_sts": 0.7919487675309846, "eval_sickr_spearman": 0.7431525714029392, "eval_stsb_spearman": 0.84074496365903, "step": 18500 }, { "epoch": 1.19, "eval_avg_sts": 0.7919787220051326, "eval_sickr_spearman": 0.7432353770218185, "eval_stsb_spearman": 0.8407220669884469, "step": 18625 }, { "epoch": 1.2, "eval_avg_sts": 0.7920516311468476, "eval_sickr_spearman": 0.7433836010008565, "eval_stsb_spearman": 0.8407196612928387, "step": 18750 }, { "epoch": 1.21, "eval_avg_sts": 0.79208040900112, "eval_sickr_spearman": 0.7434916709790923, "eval_stsb_spearman": 0.8406691470231478, "step": 18875 }, { "epoch": 1.22, "learning_rate": 2.7442723665685396e-06, "loss": 0.0001, "step": 19000 }, { "epoch": 1.22, "eval_avg_sts": 0.7915679899923007, "eval_sickr_spearman": 0.7422913257230525, "eval_stsb_spearman": 0.8408446542615489, "step": 19000 }, { "epoch": 1.22, "eval_avg_sts": 0.7924488788916606, "eval_sickr_spearman": 0.7431180370410052, "eval_stsb_spearman": 0.8417797207423161, "step": 19125 }, { "epoch": 1.23, "eval_avg_sts": 0.7925131080137356, "eval_sickr_spearman": 0.7439811559338482, "eval_stsb_spearman": 0.8410450600936231, "step": 19250 }, { "epoch": 1.24, "eval_avg_sts": 0.7923092664958495, "eval_sickr_spearman": 0.7438394641846057, "eval_stsb_spearman": 0.8407790688070933, "step": 19375 }, { "epoch": 1.25, "learning_rate": 2.632279534109817e-06, "loss": 0.0002, "step": 19500 }, { "epoch": 1.25, "eval_avg_sts": 0.7915084313605771, "eval_sickr_spearman": 0.7429506966835948, "eval_stsb_spearman": 0.8400661660375595, "step": 19500 }, { "epoch": 1.26, "eval_avg_sts": 0.7914848286255316, "eval_sickr_spearman": 0.7429546352339128, "eval_stsb_spearman": 0.8400150220171504, "step": 19625 }, { "epoch": 1.26, "eval_avg_sts": 0.7919444499131418, "eval_sickr_spearman": 0.7435056960607123, "eval_stsb_spearman": 0.8403832037655713, "step": 19750 }, { "epoch": 1.27, "eval_avg_sts": 0.7918604283998938, "eval_sickr_spearman": 0.7430511777478034, "eval_stsb_spearman": 0.8406696790519842, "step": 19875 }, { "epoch": 1.28, "learning_rate": 2.5202867016510945e-06, "loss": 0.0001, "step": 20000 }, { "epoch": 1.28, "eval_avg_sts": 0.7901084692338984, "eval_sickr_spearman": 0.7411617302794309, "eval_stsb_spearman": 0.839055208188366, "step": 20000 }, { "epoch": 1.29, "eval_avg_sts": 0.789757862825201, "eval_sickr_spearman": 0.7407969340640084, "eval_stsb_spearman": 0.8387187915863936, "step": 20125 }, { "epoch": 1.3, "eval_avg_sts": 0.7898529068915039, "eval_sickr_spearman": 0.7409771947877056, "eval_stsb_spearman": 0.8387286189953022, "step": 20250 }, { "epoch": 1.3, "eval_avg_sts": 0.789768082574833, "eval_sickr_spearman": 0.74083372588771, "eval_stsb_spearman": 0.838702439261956, "step": 20375 }, { "epoch": 1.31, "learning_rate": 2.4082938691923718e-06, "loss": 0.0, "step": 20500 }, { "epoch": 1.31, "eval_avg_sts": 0.7897954058339804, "eval_sickr_spearman": 0.7408093260881794, "eval_stsb_spearman": 0.8387814855797816, "step": 20500 }, { "epoch": 1.32, "eval_avg_sts": 0.7899947832336973, "eval_sickr_spearman": 0.7409338707342086, "eval_stsb_spearman": 0.8390556957331861, "step": 20625 }, { "epoch": 1.33, "eval_avg_sts": 0.790202509592782, "eval_sickr_spearman": 0.7411228731183674, "eval_stsb_spearman": 0.8392821460671965, "step": 20750 }, { "epoch": 1.34, "eval_avg_sts": 0.7901906011266497, "eval_sickr_spearman": 0.7410648995789316, "eval_stsb_spearman": 0.839316302674368, "step": 20875 }, { "epoch": 1.34, "learning_rate": 2.296301036733649e-06, "loss": 0.0, "step": 21000 }, { "epoch": 1.34, "eval_avg_sts": 0.7902077356957227, "eval_sickr_spearman": 0.7411439107407973, "eval_stsb_spearman": 0.839271560650648, "step": 21000 }, { "epoch": 1.35, "eval_avg_sts": 0.7901431265829444, "eval_sickr_spearman": 0.7410307494658092, "eval_stsb_spearman": 0.8392555037000796, "step": 21125 }, { "epoch": 1.36, "eval_avg_sts": 0.7921962350985728, "eval_sickr_spearman": 0.7434804797324572, "eval_stsb_spearman": 0.8409119904646885, "step": 21250 }, { "epoch": 1.37, "eval_avg_sts": 0.7922085580785473, "eval_sickr_spearman": 0.7434956095294102, "eval_stsb_spearman": 0.8409215066276844, "step": 21375 }, { "epoch": 1.38, "learning_rate": 2.1843082042749267e-06, "loss": 0.0001, "step": 21500 }, { "epoch": 1.38, "eval_avg_sts": 0.7922422656604595, "eval_sickr_spearman": 0.7434714018542854, "eval_stsb_spearman": 0.8410131294666336, "step": 21500 }, { "epoch": 1.38, "eval_avg_sts": 0.7922953172658802, "eval_sickr_spearman": 0.7435230833194328, "eval_stsb_spearman": 0.8410675512123275, "step": 21625 }, { "epoch": 1.39, "eval_avg_sts": 0.7920827130593174, "eval_sickr_spearman": 0.7432143393993886, "eval_stsb_spearman": 0.8409510867192462, "step": 21750 }, { "epoch": 1.4, "eval_avg_sts": 0.7893982619162593, "eval_sickr_spearman": 0.7409595673734778, "eval_stsb_spearman": 0.8378369564590408, "step": 21875 }, { "epoch": 1.41, "learning_rate": 2.072315371816204e-06, "loss": 0.0002, "step": 22000 }, { "epoch": 1.41, "eval_avg_sts": 0.7906089294600861, "eval_sickr_spearman": 0.7422200475685182, "eval_stsb_spearman": 0.838997811351654, "step": 22000 }, { "epoch": 1.42, "eval_avg_sts": 0.7914097742253603, "eval_sickr_spearman": 0.7423016043787602, "eval_stsb_spearman": 0.8405179440719603, "step": 22125 }, { "epoch": 1.42, "eval_avg_sts": 0.791727396078017, "eval_sickr_spearman": 0.7433686633283093, "eval_stsb_spearman": 0.8400861288277247, "step": 22250 }, { "epoch": 1.43, "eval_avg_sts": 0.7914842385018235, "eval_sickr_spearman": 0.7423251876495663, "eval_stsb_spearman": 0.8406432893540806, "step": 22375 }, { "epoch": 1.44, "learning_rate": 1.9603225393574807e-06, "loss": 0.0001, "step": 22500 }, { "epoch": 1.44, "eval_avg_sts": 0.7915202710875588, "eval_sickr_spearman": 0.7422767242682152, "eval_stsb_spearman": 0.8407638179069024, "step": 22500 }, { "epoch": 1.45, "eval_avg_sts": 0.7918702583757414, "eval_sickr_spearman": 0.7429271614438903, "eval_stsb_spearman": 0.8408133553075926, "step": 22625 }, { "epoch": 1.46, "eval_avg_sts": 0.7916045718347005, "eval_sickr_spearman": 0.7425266300889978, "eval_stsb_spearman": 0.840682513580403, "step": 22750 }, { "epoch": 1.46, "eval_avg_sts": 0.7915999641875153, "eval_sickr_spearman": 0.7422474733274393, "eval_stsb_spearman": 0.8409524550475914, "step": 22875 }, { "epoch": 1.47, "learning_rate": 1.8483297068987584e-06, "loss": 0.0002, "step": 23000 }, { "epoch": 1.47, "eval_avg_sts": 0.792815682844469, "eval_sickr_spearman": 0.7426967562502915, "eval_stsb_spearman": 0.8429346094386464, "step": 23000 }, { "epoch": 1.48, "eval_avg_sts": 0.7927916857497739, "eval_sickr_spearman": 0.7425698100491905, "eval_stsb_spearman": 0.8430135614503571, "step": 23125 }, { "epoch": 1.49, "eval_avg_sts": 0.7928345271530053, "eval_sickr_spearman": 0.7425940177243154, "eval_stsb_spearman": 0.8430750365816952, "step": 23250 }, { "epoch": 1.5, "eval_avg_sts": 0.7930442205998951, "eval_sickr_spearman": 0.7427970932211958, "eval_stsb_spearman": 0.8432913479785945, "step": 23375 }, { "epoch": 1.5, "learning_rate": 1.7363368744400357e-06, "loss": 0.0, "step": 23500 }, { "epoch": 1.5, "eval_avg_sts": 0.793033132084566, "eval_sickr_spearman": 0.7428263441619716, "eval_stsb_spearman": 0.8432399200071605, "step": 23500 }, { "epoch": 1.51, "eval_avg_sts": 0.7929242651260953, "eval_sickr_spearman": 0.7427599171486827, "eval_stsb_spearman": 0.8430886131035079, "step": 23625 }, { "epoch": 1.52, "eval_avg_sts": 0.7936208486615127, "eval_sickr_spearman": 0.7430878254782006, "eval_stsb_spearman": 0.8441538718448248, "step": 23750 }, { "epoch": 1.53, "eval_avg_sts": 0.7935886289185006, "eval_sickr_spearman": 0.7430728878056534, "eval_stsb_spearman": 0.8441043700313476, "step": 23875 }, { "epoch": 1.54, "learning_rate": 1.6243440419813131e-06, "loss": 0.0001, "step": 24000 }, { "epoch": 1.54, "eval_avg_sts": 0.7935571381985222, "eval_sickr_spearman": 0.7430181323500139, "eval_stsb_spearman": 0.8440961440470305, "step": 24000 }, { "epoch": 1.54, "eval_avg_sts": 0.7935492855380204, "eval_sickr_spearman": 0.7430870569805776, "eval_stsb_spearman": 0.8440115140954632, "step": 24125 }, { "epoch": 1.55, "eval_avg_sts": 0.7936128430055818, "eval_sickr_spearman": 0.7431491611947371, "eval_stsb_spearman": 0.8440765248164266, "step": 24250 }, { "epoch": 1.56, "eval_avg_sts": 0.7936605492215507, "eval_sickr_spearman": 0.7432605933500736, "eval_stsb_spearman": 0.844060505093028, "step": 24375 }, { "epoch": 1.57, "learning_rate": 1.5123512095225906e-06, "loss": 0.0, "step": 24500 }, { "epoch": 1.57, "eval_avg_sts": 0.793667841726459, "eval_sickr_spearman": 0.7432775483288812, "eval_stsb_spearman": 0.8440581351240368, "step": 24500 }, { "epoch": 1.58, "eval_avg_sts": 0.7948942597846932, "eval_sickr_spearman": 0.744056468700903, "eval_stsb_spearman": 0.8457320508684834, "step": 24625 }, { "epoch": 1.58, "eval_avg_sts": 0.7948721522573494, "eval_sickr_spearman": 0.7440626647129885, "eval_stsb_spearman": 0.8456816398017104, "step": 24750 }, { "epoch": 1.59, "eval_avg_sts": 0.7945095949089607, "eval_sickr_spearman": 0.7443504190417043, "eval_stsb_spearman": 0.8446687707762169, "step": 24875 }, { "epoch": 1.6, "learning_rate": 1.4003583770638678e-06, "loss": 0.0001, "step": 25000 }, { "epoch": 1.6, "eval_avg_sts": 0.7947724077574231, "eval_sickr_spearman": 0.7446924004839437, "eval_stsb_spearman": 0.8448524150309025, "step": 25000 }, { "epoch": 1.61, "eval_avg_sts": 0.7959915253602992, "eval_sickr_spearman": 0.7461332854959857, "eval_stsb_spearman": 0.8458497652246126, "step": 25125 }, { "epoch": 1.62, "eval_avg_sts": 0.7955281876289857, "eval_sickr_spearman": 0.7458754244134463, "eval_stsb_spearman": 0.845180950844525, "step": 25250 }, { "epoch": 1.62, "eval_avg_sts": 0.79543745522762, "eval_sickr_spearman": 0.7456630610129066, "eval_stsb_spearman": 0.8452118494423333, "step": 25375 }, { "epoch": 1.63, "learning_rate": 1.2883655446051453e-06, "loss": 0.0001, "step": 25500 }, { "epoch": 1.63, "eval_avg_sts": 0.795353488562289, "eval_sickr_spearman": 0.7455269408714309, "eval_stsb_spearman": 0.8451800362531473, "step": 25500 }, { "epoch": 1.64, "eval_avg_sts": 0.7953584932327289, "eval_sickr_spearman": 0.745271175256273, "eval_stsb_spearman": 0.8454458112091847, "step": 25625 }, { "epoch": 1.65, "eval_avg_sts": 0.7953254322370598, "eval_sickr_spearman": 0.7452719917849974, "eval_stsb_spearman": 0.8453788726891222, "step": 25750 }, { "epoch": 1.66, "eval_avg_sts": 0.7952872018869009, "eval_sickr_spearman": 0.7452931735007315, "eval_stsb_spearman": 0.8452812302730703, "step": 25875 }, { "epoch": 1.66, "learning_rate": 1.1763727121464225e-06, "loss": 0.0001, "step": 26000 }, { "epoch": 1.66, "eval_avg_sts": 0.7952607086010879, "eval_sickr_spearman": 0.7453110410704665, "eval_stsb_spearman": 0.8452103761317094, "step": 26000 }, { "epoch": 1.67, "eval_avg_sts": 0.7950903508557705, "eval_sickr_spearman": 0.7449656494200251, "eval_stsb_spearman": 0.8452150522915161, "step": 26125 }, { "epoch": 1.68, "eval_avg_sts": 0.7950105822340711, "eval_sickr_spearman": 0.7448497023411534, "eval_stsb_spearman": 0.8451714621269887, "step": 26250 }, { "epoch": 1.69, "eval_avg_sts": 0.7950131323560599, "eval_sickr_spearman": 0.744852055865124, "eval_stsb_spearman": 0.8451742088469958, "step": 26375 }, { "epoch": 1.7, "learning_rate": 1.0643798796877e-06, "loss": 0.0001, "step": 26500 }, { "epoch": 1.7, "eval_avg_sts": 0.7950484138603111, "eval_sickr_spearman": 0.7455690161162907, "eval_stsb_spearman": 0.8445278116043317, "step": 26500 }, { "epoch": 1.7, "eval_avg_sts": 0.7950041615346236, "eval_sickr_spearman": 0.7455438958502385, "eval_stsb_spearman": 0.8444644272190087, "step": 26625 }, { "epoch": 1.71, "eval_avg_sts": 0.7946972455858132, "eval_sickr_spearman": 0.745472569664603, "eval_stsb_spearman": 0.8439219215070236, "step": 26750 }, { "epoch": 1.72, "eval_avg_sts": 0.7944591743219949, "eval_sickr_spearman": 0.7454866427773243, "eval_stsb_spearman": 0.8434317058666653, "step": 26875 }, { "epoch": 1.73, "learning_rate": 9.523870472289774e-07, "loss": 0.0001, "step": 27000 }, { "epoch": 1.73, "eval_avg_sts": 0.7944066177099748, "eval_sickr_spearman": 0.7454395722979149, "eval_stsb_spearman": 0.8433736631220347, "step": 27000 }, { "epoch": 1.74, "eval_avg_sts": 0.7944436945207991, "eval_sickr_spearman": 0.7455328006658063, "eval_stsb_spearman": 0.8433545883757919, "step": 27125 }, { "epoch": 1.74, "eval_avg_sts": 0.7944797298738457, "eval_sickr_spearman": 0.7455790065853898, "eval_stsb_spearman": 0.8433804531623017, "step": 27250 }, { "epoch": 1.75, "eval_avg_sts": 0.7944698737687554, "eval_sickr_spearman": 0.7455735310398258, "eval_stsb_spearman": 0.8433662164976851, "step": 27375 }, { "epoch": 1.76, "learning_rate": 8.403942147702547e-07, "loss": 0.0001, "step": 27500 }, { "epoch": 1.76, "eval_avg_sts": 0.7942514496393891, "eval_sickr_spearman": 0.74535724699005, "eval_stsb_spearman": 0.8431456522887281, "step": 27500 }, { "epoch": 1.77, "eval_avg_sts": 0.7944530448391101, "eval_sickr_spearman": 0.7454611862935621, "eval_stsb_spearman": 0.8434449033846582, "step": 27625 }, { "epoch": 1.78, "eval_avg_sts": 0.7944670140899726, "eval_sickr_spearman": 0.7455168063090274, "eval_stsb_spearman": 0.8434172218709176, "step": 27750 }, { "epoch": 1.78, "eval_avg_sts": 0.7944968856863333, "eval_sickr_spearman": 0.7455487469914838, "eval_stsb_spearman": 0.8434450243811827, "step": 27875 }, { "epoch": 1.79, "learning_rate": 7.284013823115321e-07, "loss": 0.0001, "step": 28000 }, { "epoch": 1.79, "eval_avg_sts": 0.7944813522912897, "eval_sickr_spearman": 0.7459449555472468, "eval_stsb_spearman": 0.8430177490353326, "step": 28000 }, { "epoch": 1.8, "eval_avg_sts": 0.7944717848510598, "eval_sickr_spearman": 0.7458816025244499, "eval_stsb_spearman": 0.8430619671776697, "step": 28125 }, { "epoch": 1.81, "eval_avg_sts": 0.7943252967954475, "eval_sickr_spearman": 0.7455355384385883, "eval_stsb_spearman": 0.8431150551523066, "step": 28250 }, { "epoch": 1.82, "eval_avg_sts": 0.7945802673668048, "eval_sickr_spearman": 0.7459384233174512, "eval_stsb_spearman": 0.8432221114161584, "step": 28375 }, { "epoch": 1.82, "learning_rate": 6.164085498528094e-07, "loss": 0.0001, "step": 28500 }, { "epoch": 1.82, "eval_avg_sts": 0.7945695711998493, "eval_sickr_spearman": 0.7459346288604376, "eval_stsb_spearman": 0.843204513539261, "step": 28500 }, { "epoch": 1.83, "eval_avg_sts": 0.7945396361578374, "eval_sickr_spearman": 0.7462354956798459, "eval_stsb_spearman": 0.8428437766358288, "step": 28625 }, { "epoch": 1.84, "eval_avg_sts": 0.7944409539151067, "eval_sickr_spearman": 0.7461240814315593, "eval_stsb_spearman": 0.8427578263986542, "step": 28750 }, { "epoch": 1.85, "eval_avg_sts": 0.7940565976087757, "eval_sickr_spearman": 0.7457283833108623, "eval_stsb_spearman": 0.8423848119066891, "step": 28875 }, { "epoch": 1.86, "learning_rate": 5.044157173940868e-07, "loss": 0.0002, "step": 29000 }, { "epoch": 1.86, "eval_avg_sts": 0.7940545279108154, "eval_sickr_spearman": 0.7457486524356691, "eval_stsb_spearman": 0.8423604033859617, "step": 29000 }, { "epoch": 1.86, "eval_avg_sts": 0.7940541798236898, "eval_sickr_spearman": 0.7457327061099918, "eval_stsb_spearman": 0.8423756535373876, "step": 29125 }, { "epoch": 1.87, "eval_avg_sts": 0.794045870127827, "eval_sickr_spearman": 0.7457254534136746, "eval_stsb_spearman": 0.8423662868419793, "step": 29250 }, { "epoch": 1.88, "eval_avg_sts": 0.7939439159521589, "eval_sickr_spearman": 0.7456850112262637, "eval_stsb_spearman": 0.8422028206780539, "step": 29375 }, { "epoch": 1.89, "learning_rate": 3.9242288493536413e-07, "loss": 0.0001, "step": 29500 }, { "epoch": 1.89, "eval_avg_sts": 0.7938843170635432, "eval_sickr_spearman": 0.7456857797238867, "eval_stsb_spearman": 0.8420828544031996, "step": 29500 }, { "epoch": 1.9, "eval_avg_sts": 0.7938335370035037, "eval_sickr_spearman": 0.7456398619909119, "eval_stsb_spearman": 0.8420272120160953, "step": 29625 }, { "epoch": 1.9, "eval_avg_sts": 0.7937791099281831, "eval_sickr_spearman": 0.7455667765481975, "eval_stsb_spearman": 0.8419914433081688, "step": 29750 }, { "epoch": 1.91, "eval_avg_sts": 0.7937599626397398, "eval_sickr_spearman": 0.7455335691634293, "eval_stsb_spearman": 0.8419863561160503, "step": 29875 }, { "epoch": 1.92, "learning_rate": 2.804300524766415e-07, "loss": 0.0001, "step": 30000 }, { "epoch": 1.92, "eval_avg_sts": 0.7937406443684292, "eval_sickr_spearman": 0.7454874593060488, "eval_stsb_spearman": 0.8419938294308097, "step": 30000 }, { "epoch": 1.93, "eval_avg_sts": 0.7939020781683644, "eval_sickr_spearman": 0.7457190652771832, "eval_stsb_spearman": 0.8420850910595457, "step": 30125 }, { "epoch": 1.94, "eval_avg_sts": 0.7938812791358627, "eval_sickr_spearman": 0.7456977394681448, "eval_stsb_spearman": 0.8420648188035805, "step": 30250 }, { "epoch": 1.94, "eval_avg_sts": 0.7937378630658074, "eval_sickr_spearman": 0.7454741066598489, "eval_stsb_spearman": 0.842001619471766, "step": 30375 }, { "epoch": 1.95, "learning_rate": 1.6843722001791884e-07, "loss": 0.0002, "step": 30500 }, { "epoch": 1.95, "eval_avg_sts": 0.7937467005092009, "eval_sickr_spearman": 0.7454940875980473, "eval_stsb_spearman": 0.8419993134203545, "step": 30500 }, { "epoch": 1.96, "eval_avg_sts": 0.7937544654414969, "eval_sickr_spearman": 0.7454804467652388, "eval_stsb_spearman": 0.8420284841177549, "step": 30625 }, { "epoch": 1.97, "eval_avg_sts": 0.7937753802718709, "eval_sickr_spearman": 0.7455158937181001, "eval_stsb_spearman": 0.8420348668256417, "step": 30750 }, { "epoch": 1.98, "eval_avg_sts": 0.7937608907538469, "eval_sickr_spearman": 0.745488035679266, "eval_stsb_spearman": 0.8420337458284277, "step": 30875 }, { "epoch": 1.98, "learning_rate": 5.64443875591962e-08, "loss": 0.0001, "step": 31000 }, { "epoch": 1.98, "eval_avg_sts": 0.7937471629995045, "eval_sickr_spearman": 0.7454658933415031, "eval_stsb_spearman": 0.8420284326575058, "step": 31000 }, { "epoch": 1.99, "eval_avg_sts": 0.7937690011247767, "eval_sickr_spearman": 0.7455096977060146, "eval_stsb_spearman": 0.8420283045435387, "step": 31125 }, { "epoch": 2.0, "eval_avg_sts": 0.7937804647459197, "eval_sickr_spearman": 0.7455530217595118, "eval_stsb_spearman": 0.8420079077323277, "step": 31250 }, { "epoch": 2.0, "step": 31252, "train_runtime": 9641.8618, "train_samples_per_second": 3.241 } ], "max_steps": 31252, "num_train_epochs": 2, "total_flos": 333421219511531712, "trial_name": null, "trial_params": null }