InfoCSE-bert-base / trainer_state.json
root
init
defdc43
{
"best_metric": 0.8548645464866416,
"best_model_checkpoint": "result/InfoCSE-bert-base",
"epoch": 2.0,
"global_step": 31252,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"eval_avg_sts": 0.645032772395593,
"eval_sickr_spearman": 0.6463705264094609,
"eval_stsb_spearman": 0.643695018381725,
"step": 125
},
{
"epoch": 0.02,
"eval_avg_sts": 0.685240727331801,
"eval_sickr_spearman": 0.669725073110526,
"eval_stsb_spearman": 0.700756381553076,
"step": 250
},
{
"epoch": 0.02,
"eval_avg_sts": 0.7027556246143734,
"eval_sickr_spearman": 0.6818145493736003,
"eval_stsb_spearman": 0.7236966998551464,
"step": 375
},
{
"epoch": 0.03,
"learning_rate": 6.888007167541277e-06,
"loss": 0.0008,
"step": 500
},
{
"epoch": 0.03,
"eval_avg_sts": 0.7085517582757557,
"eval_sickr_spearman": 0.6868034438177743,
"eval_stsb_spearman": 0.730300072733737,
"step": 500
},
{
"epoch": 0.04,
"eval_avg_sts": 0.7152446421256347,
"eval_sickr_spearman": 0.6908805158322469,
"eval_stsb_spearman": 0.7396087684190223,
"step": 625
},
{
"epoch": 0.05,
"eval_avg_sts": 0.744333698385975,
"eval_sickr_spearman": 0.7107611650906991,
"eval_stsb_spearman": 0.7779062316812507,
"step": 750
},
{
"epoch": 0.06,
"eval_avg_sts": 0.749906268768782,
"eval_sickr_spearman": 0.7164115438638786,
"eval_stsb_spearman": 0.7834009936736853,
"step": 875
},
{
"epoch": 0.06,
"learning_rate": 6.776014335082554e-06,
"loss": 0.0003,
"step": 1000
},
{
"epoch": 0.06,
"eval_avg_sts": 0.7527465185576756,
"eval_sickr_spearman": 0.7194187230938174,
"eval_stsb_spearman": 0.7860743140215339,
"step": 1000
},
{
"epoch": 0.07,
"eval_avg_sts": 0.7563795190354858,
"eval_sickr_spearman": 0.7197145466475747,
"eval_stsb_spearman": 0.793044491423397,
"step": 1125
},
{
"epoch": 0.08,
"eval_avg_sts": 0.7577088125126856,
"eval_sickr_spearman": 0.7209790134240346,
"eval_stsb_spearman": 0.7944386116013368,
"step": 1250
},
{
"epoch": 0.09,
"eval_avg_sts": 0.7618327362445115,
"eval_sickr_spearman": 0.7205304029366025,
"eval_stsb_spearman": 0.8031350695524205,
"step": 1375
},
{
"epoch": 0.1,
"learning_rate": 6.6640215026238325e-06,
"loss": 0.0004,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.7526454517508075,
"eval_sickr_spearman": 0.7131317881332785,
"eval_stsb_spearman": 0.7921591153683366,
"step": 1500
},
{
"epoch": 0.1,
"eval_avg_sts": 0.7584465941723788,
"eval_sickr_spearman": 0.7183862465373038,
"eval_stsb_spearman": 0.798506941807454,
"step": 1625
},
{
"epoch": 0.11,
"eval_avg_sts": 0.7600830398569421,
"eval_sickr_spearman": 0.7199089285150947,
"eval_stsb_spearman": 0.8002571511987896,
"step": 1750
},
{
"epoch": 0.12,
"eval_avg_sts": 0.753643480678329,
"eval_sickr_spearman": 0.7154178764373269,
"eval_stsb_spearman": 0.7918690849193311,
"step": 1875
},
{
"epoch": 0.13,
"learning_rate": 6.55202867016511e-06,
"loss": 0.0002,
"step": 2000
},
{
"epoch": 0.13,
"eval_avg_sts": 0.7563852037282979,
"eval_sickr_spearman": 0.7193429780468495,
"eval_stsb_spearman": 0.7934274294097461,
"step": 2000
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7664707372188553,
"eval_sickr_spearman": 0.7240147231282276,
"eval_stsb_spearman": 0.8089267513094829,
"step": 2125
},
{
"epoch": 0.14,
"eval_avg_sts": 0.7706419135337745,
"eval_sickr_spearman": 0.7288192261739805,
"eval_stsb_spearman": 0.8124646008935686,
"step": 2250
},
{
"epoch": 0.15,
"eval_avg_sts": 0.7712663844837009,
"eval_sickr_spearman": 0.7299219242007967,
"eval_stsb_spearman": 0.8126108447666052,
"step": 2375
},
{
"epoch": 0.16,
"learning_rate": 6.440035837706387e-06,
"loss": 0.0002,
"step": 2500
},
{
"epoch": 0.16,
"eval_avg_sts": 0.7728606127631258,
"eval_sickr_spearman": 0.7312590620337324,
"eval_stsb_spearman": 0.8144621634925192,
"step": 2500
},
{
"epoch": 0.17,
"eval_avg_sts": 0.7729813550763709,
"eval_sickr_spearman": 0.7313422519014231,
"eval_stsb_spearman": 0.8146204582513188,
"step": 2625
},
{
"epoch": 0.18,
"eval_avg_sts": 0.7754932728462534,
"eval_sickr_spearman": 0.7312568526030662,
"eval_stsb_spearman": 0.8197296930894405,
"step": 2750
},
{
"epoch": 0.18,
"eval_avg_sts": 0.7712885427125948,
"eval_sickr_spearman": 0.7266254056157947,
"eval_stsb_spearman": 0.8159516798093949,
"step": 2875
},
{
"epoch": 0.19,
"learning_rate": 6.328043005247664e-06,
"loss": 0.0002,
"step": 3000
},
{
"epoch": 0.19,
"eval_avg_sts": 0.7716849957034901,
"eval_sickr_spearman": 0.7262548936993011,
"eval_stsb_spearman": 0.8171150977076791,
"step": 3000
},
{
"epoch": 0.2,
"eval_avg_sts": 0.7711561198226983,
"eval_sickr_spearman": 0.7262503241591916,
"eval_stsb_spearman": 0.816061915486205,
"step": 3125
},
{
"epoch": 0.21,
"eval_avg_sts": 0.7783568816799603,
"eval_sickr_spearman": 0.7303159233258935,
"eval_stsb_spearman": 0.8263978400340272,
"step": 3250
},
{
"epoch": 0.22,
"eval_avg_sts": 0.7809228297940308,
"eval_sickr_spearman": 0.7337628272894983,
"eval_stsb_spearman": 0.8280828322985634,
"step": 3375
},
{
"epoch": 0.22,
"learning_rate": 6.2160501727889415e-06,
"loss": 0.0001,
"step": 3500
},
{
"epoch": 0.22,
"eval_avg_sts": 0.7797812899347809,
"eval_sickr_spearman": 0.7324181485736369,
"eval_stsb_spearman": 0.8271444312959251,
"step": 3500
},
{
"epoch": 0.23,
"eval_avg_sts": 0.780044187865891,
"eval_sickr_spearman": 0.7338939041653229,
"eval_stsb_spearman": 0.8261944715664592,
"step": 3625
},
{
"epoch": 0.24,
"eval_avg_sts": 0.7787673562775448,
"eval_sickr_spearman": 0.7328702653314738,
"eval_stsb_spearman": 0.8246644472236156,
"step": 3750
},
{
"epoch": 0.25,
"eval_avg_sts": 0.779541327716536,
"eval_sickr_spearman": 0.7329598913667574,
"eval_stsb_spearman": 0.8261227640663145,
"step": 3875
},
{
"epoch": 0.26,
"learning_rate": 6.104057340330219e-06,
"loss": 0.0003,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.7747719384340315,
"eval_sickr_spearman": 0.7285930957484098,
"eval_stsb_spearman": 0.8209507811196531,
"step": 4000
},
{
"epoch": 0.26,
"eval_avg_sts": 0.7765396311685044,
"eval_sickr_spearman": 0.7301922912707919,
"eval_stsb_spearman": 0.8228869710662171,
"step": 4125
},
{
"epoch": 0.27,
"eval_avg_sts": 0.7728155845030844,
"eval_sickr_spearman": 0.7257823156922516,
"eval_stsb_spearman": 0.8198488533139171,
"step": 4250
},
{
"epoch": 0.28,
"eval_avg_sts": 0.7734186821765212,
"eval_sickr_spearman": 0.7266760303967105,
"eval_stsb_spearman": 0.8201613339563318,
"step": 4375
},
{
"epoch": 0.29,
"learning_rate": 5.992064507871497e-06,
"loss": 0.0004,
"step": 4500
},
{
"epoch": 0.29,
"eval_avg_sts": 0.7731296739509669,
"eval_sickr_spearman": 0.7214541370794603,
"eval_stsb_spearman": 0.8248052108224735,
"step": 4500
},
{
"epoch": 0.3,
"eval_avg_sts": 0.7728203601265164,
"eval_sickr_spearman": 0.7219969845879138,
"eval_stsb_spearman": 0.8236437356651191,
"step": 4625
},
{
"epoch": 0.3,
"eval_avg_sts": 0.773140320693449,
"eval_sickr_spearman": 0.7226297943493609,
"eval_stsb_spearman": 0.823650847037537,
"step": 4750
},
{
"epoch": 0.31,
"eval_avg_sts": 0.7776841987101548,
"eval_sickr_spearman": 0.7260857761911376,
"eval_stsb_spearman": 0.8292826212291721,
"step": 4875
},
{
"epoch": 0.32,
"learning_rate": 5.880071675412773e-06,
"loss": 0.0001,
"step": 5000
},
{
"epoch": 0.32,
"eval_avg_sts": 0.7787697170418183,
"eval_sickr_spearman": 0.7268813633553585,
"eval_stsb_spearman": 0.8306580707282781,
"step": 5000
},
{
"epoch": 0.33,
"eval_avg_sts": 0.7794054673251014,
"eval_sickr_spearman": 0.727022190544775,
"eval_stsb_spearman": 0.8317887441054277,
"step": 5125
},
{
"epoch": 0.34,
"eval_avg_sts": 0.7794784586068343,
"eval_sickr_spearman": 0.7302013691489637,
"eval_stsb_spearman": 0.8287555480647049,
"step": 5250
},
{
"epoch": 0.34,
"eval_avg_sts": 0.7771717407788259,
"eval_sickr_spearman": 0.7244288472848269,
"eval_stsb_spearman": 0.829914634272825,
"step": 5375
},
{
"epoch": 0.35,
"learning_rate": 5.7680788429540505e-06,
"loss": 0.0003,
"step": 5500
},
{
"epoch": 0.35,
"eval_avg_sts": 0.778478777290903,
"eval_sickr_spearman": 0.7256252059594475,
"eval_stsb_spearman": 0.8313323486223586,
"step": 5500
},
{
"epoch": 0.36,
"eval_avg_sts": 0.7793214110914728,
"eval_sickr_spearman": 0.726303453142855,
"eval_stsb_spearman": 0.8323393690400904,
"step": 5625
},
{
"epoch": 0.37,
"eval_avg_sts": 0.7791715295390024,
"eval_sickr_spearman": 0.7257507592586067,
"eval_stsb_spearman": 0.8325922998193981,
"step": 5750
},
{
"epoch": 0.38,
"eval_avg_sts": 0.7800081020871235,
"eval_sickr_spearman": 0.726603503433539,
"eval_stsb_spearman": 0.8334127007407081,
"step": 5875
},
{
"epoch": 0.38,
"learning_rate": 5.656086010495328e-06,
"loss": 0.0001,
"step": 6000
},
{
"epoch": 0.38,
"eval_avg_sts": 0.7802662913925068,
"eval_sickr_spearman": 0.7272382344390437,
"eval_stsb_spearman": 0.8332943483459699,
"step": 6000
},
{
"epoch": 0.39,
"eval_avg_sts": 0.7788831909074992,
"eval_sickr_spearman": 0.7254892779423776,
"eval_stsb_spearman": 0.8322771038726209,
"step": 6125
},
{
"epoch": 0.4,
"eval_avg_sts": 0.7790896526834474,
"eval_sickr_spearman": 0.7246235173389557,
"eval_stsb_spearman": 0.8335557880279391,
"step": 6250
},
{
"epoch": 0.41,
"eval_avg_sts": 0.7811606337604482,
"eval_sickr_spearman": 0.7249414832304759,
"eval_stsb_spearman": 0.8373797842904204,
"step": 6375
},
{
"epoch": 0.42,
"learning_rate": 5.544093178036605e-06,
"loss": 0.0001,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.7814213566702608,
"eval_sickr_spearman": 0.7254279422258411,
"eval_stsb_spearman": 0.8374147711146805,
"step": 6500
},
{
"epoch": 0.42,
"eval_avg_sts": 0.7818500804137162,
"eval_sickr_spearman": 0.726220023119657,
"eval_stsb_spearman": 0.8374801377077753,
"step": 6625
},
{
"epoch": 0.43,
"eval_avg_sts": 0.7832040571269738,
"eval_sickr_spearman": 0.7301835015792287,
"eval_stsb_spearman": 0.8362246126747188,
"step": 6750
},
{
"epoch": 0.44,
"eval_avg_sts": 0.7841900708722672,
"eval_sickr_spearman": 0.731056755034475,
"eval_stsb_spearman": 0.8373233867100595,
"step": 6875
},
{
"epoch": 0.45,
"learning_rate": 5.432100345577883e-06,
"loss": 0.0001,
"step": 7000
},
{
"epoch": 0.45,
"eval_avg_sts": 0.7862472754964975,
"eval_sickr_spearman": 0.7333967342343369,
"eval_stsb_spearman": 0.839097816758658,
"step": 7000
},
{
"epoch": 0.46,
"eval_avg_sts": 0.7859634761320248,
"eval_sickr_spearman": 0.7330241089493801,
"eval_stsb_spearman": 0.8389028433146695,
"step": 7125
},
{
"epoch": 0.46,
"eval_avg_sts": 0.7821803440191185,
"eval_sickr_spearman": 0.7303841755210372,
"eval_stsb_spearman": 0.8339765125171998,
"step": 7250
},
{
"epoch": 0.47,
"eval_avg_sts": 0.7825744125697178,
"eval_sickr_spearman": 0.7306357624303699,
"eval_stsb_spearman": 0.8345130627090659,
"step": 7375
},
{
"epoch": 0.48,
"learning_rate": 5.32010751311916e-06,
"loss": 0.0001,
"step": 7500
},
{
"epoch": 0.48,
"eval_avg_sts": 0.78116110534451,
"eval_sickr_spearman": 0.7276775268927966,
"eval_stsb_spearman": 0.8346446837962234,
"step": 7500
},
{
"epoch": 0.49,
"eval_avg_sts": 0.7799908773501631,
"eval_sickr_spearman": 0.7237501678215064,
"eval_stsb_spearman": 0.83623158687882,
"step": 7625
},
{
"epoch": 0.5,
"eval_avg_sts": 0.780269211830304,
"eval_sickr_spearman": 0.7244608359983847,
"eval_stsb_spearman": 0.8360775876622232,
"step": 7750
},
{
"epoch": 0.5,
"eval_avg_sts": 0.7807594418954099,
"eval_sickr_spearman": 0.7247573319875622,
"eval_stsb_spearman": 0.8367615518032576,
"step": 7875
},
{
"epoch": 0.51,
"learning_rate": 5.2081146806604376e-06,
"loss": 0.0001,
"step": 8000
},
{
"epoch": 0.51,
"eval_avg_sts": 0.7809657512161441,
"eval_sickr_spearman": 0.7257775125821077,
"eval_stsb_spearman": 0.8361539898501805,
"step": 8000
},
{
"epoch": 0.52,
"eval_avg_sts": 0.7808305047079998,
"eval_sickr_spearman": 0.7258256397457487,
"eval_stsb_spearman": 0.8358353696702507,
"step": 8125
},
{
"epoch": 0.53,
"eval_avg_sts": 0.7808244974473546,
"eval_sickr_spearman": 0.7260765061885599,
"eval_stsb_spearman": 0.8355724887061494,
"step": 8250
},
{
"epoch": 0.54,
"eval_avg_sts": 0.7807531331871759,
"eval_sickr_spearman": 0.725998455648723,
"eval_stsb_spearman": 0.8355078107256287,
"step": 8375
},
{
"epoch": 0.54,
"learning_rate": 5.096121848201715e-06,
"loss": 0.0001,
"step": 8500
},
{
"epoch": 0.54,
"eval_avg_sts": 0.7805553727181309,
"eval_sickr_spearman": 0.7259074847425994,
"eval_stsb_spearman": 0.8352032606936624,
"step": 8500
},
{
"epoch": 0.55,
"eval_avg_sts": 0.7840901636781107,
"eval_sickr_spearman": 0.727197936344937,
"eval_stsb_spearman": 0.8409823910112844,
"step": 8625
},
{
"epoch": 0.56,
"eval_avg_sts": 0.7841336470257416,
"eval_sickr_spearman": 0.7241774524998998,
"eval_stsb_spearman": 0.8440898415515834,
"step": 8750
},
{
"epoch": 0.57,
"eval_avg_sts": 0.7848770188208263,
"eval_sickr_spearman": 0.7246812987539857,
"eval_stsb_spearman": 0.8450727388876668,
"step": 8875
},
{
"epoch": 0.58,
"learning_rate": 4.984129015742992e-06,
"loss": 0.0001,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.7851602291221325,
"eval_sickr_spearman": 0.7257603654788943,
"eval_stsb_spearman": 0.8445600927653706,
"step": 9000
},
{
"epoch": 0.58,
"eval_avg_sts": 0.7881113225894085,
"eval_sickr_spearman": 0.7297208179790754,
"eval_stsb_spearman": 0.8465018271997418,
"step": 9125
},
{
"epoch": 0.59,
"eval_avg_sts": 0.7883865180777926,
"eval_sickr_spearman": 0.7305029084037921,
"eval_stsb_spearman": 0.8462701277517931,
"step": 9250
},
{
"epoch": 0.6,
"eval_avg_sts": 0.7905936766250409,
"eval_sickr_spearman": 0.7318727073857056,
"eval_stsb_spearman": 0.8493146458643761,
"step": 9375
},
{
"epoch": 0.61,
"learning_rate": 4.872136183284269e-06,
"loss": 0.0002,
"step": 9500
},
{
"epoch": 0.61,
"eval_avg_sts": 0.7894195399749903,
"eval_sickr_spearman": 0.7297918559781024,
"eval_stsb_spearman": 0.8490472239718782,
"step": 9500
},
{
"epoch": 0.62,
"eval_avg_sts": 0.7888302258840285,
"eval_sickr_spearman": 0.7290175946229199,
"eval_stsb_spearman": 0.848642857145137,
"step": 9625
},
{
"epoch": 0.62,
"eval_avg_sts": 0.7898168606884958,
"eval_sickr_spearman": 0.7311126152054476,
"eval_stsb_spearman": 0.848521106171544,
"step": 9750
},
{
"epoch": 0.63,
"eval_avg_sts": 0.7916780015304804,
"eval_sickr_spearman": 0.7336695508905056,
"eval_stsb_spearman": 0.8496864521704552,
"step": 9875
},
{
"epoch": 0.64,
"learning_rate": 4.760143350825547e-06,
"loss": 0.0001,
"step": 10000
},
{
"epoch": 0.64,
"eval_avg_sts": 0.7916349913886156,
"eval_sickr_spearman": 0.7339293030870828,
"eval_stsb_spearman": 0.8493406796901484,
"step": 10000
},
{
"epoch": 0.65,
"eval_avg_sts": 0.791507759549186,
"eval_sickr_spearman": 0.7339989962152694,
"eval_stsb_spearman": 0.8490165228831026,
"step": 10125
},
{
"epoch": 0.66,
"eval_avg_sts": 0.789931989918206,
"eval_sickr_spearman": 0.7311775052234905,
"eval_stsb_spearman": 0.8486864746129216,
"step": 10250
},
{
"epoch": 0.66,
"eval_avg_sts": 0.7899616736779131,
"eval_sickr_spearman": 0.7317643492208613,
"eval_stsb_spearman": 0.8481589981349649,
"step": 10375
},
{
"epoch": 0.67,
"learning_rate": 4.648150518366825e-06,
"loss": 0.0001,
"step": 10500
},
{
"epoch": 0.67,
"eval_avg_sts": 0.7926863693434811,
"eval_sickr_spearman": 0.7347004424206716,
"eval_stsb_spearman": 0.8506722962662906,
"step": 10500
},
{
"epoch": 0.68,
"eval_avg_sts": 0.7925310701894714,
"eval_sickr_spearman": 0.7345030826248625,
"eval_stsb_spearman": 0.8505590577540805,
"step": 10625
},
{
"epoch": 0.69,
"eval_avg_sts": 0.7921847237714013,
"eval_sickr_spearman": 0.734286503995874,
"eval_stsb_spearman": 0.8500829435469286,
"step": 10750
},
{
"epoch": 0.7,
"eval_avg_sts": 0.792045037000692,
"eval_sickr_spearman": 0.7345833425953655,
"eval_stsb_spearman": 0.8495067314060183,
"step": 10875
},
{
"epoch": 0.7,
"learning_rate": 4.536157685908102e-06,
"loss": 0.0001,
"step": 11000
},
{
"epoch": 0.7,
"eval_avg_sts": 0.7924996456713199,
"eval_sickr_spearman": 0.7354074602338407,
"eval_stsb_spearman": 0.8495918311087991,
"step": 11000
},
{
"epoch": 0.71,
"eval_avg_sts": 0.7924266596358673,
"eval_sickr_spearman": 0.7356516503535521,
"eval_stsb_spearman": 0.8492016689181826,
"step": 11125
},
{
"epoch": 0.72,
"eval_avg_sts": 0.7926706111519558,
"eval_sickr_spearman": 0.7358917097985398,
"eval_stsb_spearman": 0.8494495125053718,
"step": 11250
},
{
"epoch": 0.73,
"eval_avg_sts": 0.7930288164708986,
"eval_sickr_spearman": 0.7354914185991545,
"eval_stsb_spearman": 0.8505662143426428,
"step": 11375
},
{
"epoch": 0.74,
"learning_rate": 4.424164853449379e-06,
"loss": 0.0002,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.7926251189281965,
"eval_sickr_spearman": 0.7351442017668584,
"eval_stsb_spearman": 0.8501060360895348,
"step": 11500
},
{
"epoch": 0.74,
"eval_avg_sts": 0.7932695687388167,
"eval_sickr_spearman": 0.7365684199867013,
"eval_stsb_spearman": 0.8499707174909322,
"step": 11625
},
{
"epoch": 0.75,
"eval_avg_sts": 0.7935921856407616,
"eval_sickr_spearman": 0.7367729844477262,
"eval_stsb_spearman": 0.850411386833797,
"step": 11750
},
{
"epoch": 0.76,
"eval_avg_sts": 0.794782209944985,
"eval_sickr_spearman": 0.7389587838119719,
"eval_stsb_spearman": 0.8506056360779983,
"step": 11875
},
{
"epoch": 0.77,
"learning_rate": 4.312172020990656e-06,
"loss": 0.0002,
"step": 12000
},
{
"epoch": 0.77,
"eval_avg_sts": 0.7971707208949131,
"eval_sickr_spearman": 0.7394768953031847,
"eval_stsb_spearman": 0.8548645464866416,
"step": 12000
},
{
"epoch": 0.78,
"eval_avg_sts": 0.797638118412404,
"eval_sickr_spearman": 0.7421029957743136,
"eval_stsb_spearman": 0.8531732410504944,
"step": 12125
},
{
"epoch": 0.78,
"eval_avg_sts": 0.7969091025343611,
"eval_sickr_spearman": 0.741429359576644,
"eval_stsb_spearman": 0.8523888454920783,
"step": 12250
},
{
"epoch": 0.79,
"eval_avg_sts": 0.7919648350492454,
"eval_sickr_spearman": 0.7347034683800623,
"eval_stsb_spearman": 0.8492262017184287,
"step": 12375
},
{
"epoch": 0.8,
"learning_rate": 4.2001791885319345e-06,
"loss": 0.0005,
"step": 12500
},
{
"epoch": 0.8,
"eval_avg_sts": 0.7921636059370547,
"eval_sickr_spearman": 0.7353516480939697,
"eval_stsb_spearman": 0.8489755637801396,
"step": 12500
},
{
"epoch": 0.81,
"eval_avg_sts": 0.7924202367929077,
"eval_sickr_spearman": 0.736975675695795,
"eval_stsb_spearman": 0.8478647978900204,
"step": 12625
},
{
"epoch": 0.82,
"eval_avg_sts": 0.7890475112371416,
"eval_sickr_spearman": 0.7355575093947334,
"eval_stsb_spearman": 0.8425375130795496,
"step": 12750
},
{
"epoch": 0.82,
"eval_avg_sts": 0.7892144058224184,
"eval_sickr_spearman": 0.7356575101479275,
"eval_stsb_spearman": 0.8427713014969095,
"step": 12875
},
{
"epoch": 0.83,
"learning_rate": 4.088186356073212e-06,
"loss": 0.0002,
"step": 13000
},
{
"epoch": 0.83,
"eval_avg_sts": 0.7908518455947956,
"eval_sickr_spearman": 0.73698621219475,
"eval_stsb_spearman": 0.8447174789948412,
"step": 13000
},
{
"epoch": 0.84,
"eval_avg_sts": 0.7910358332545967,
"eval_sickr_spearman": 0.7372511340625426,
"eval_stsb_spearman": 0.8448205324466508,
"step": 13125
},
{
"epoch": 0.85,
"eval_avg_sts": 0.7910819619646265,
"eval_sickr_spearman": 0.7366442130647706,
"eval_stsb_spearman": 0.8455197108644826,
"step": 13250
},
{
"epoch": 0.86,
"eval_avg_sts": 0.7913313391681369,
"eval_sickr_spearman": 0.7369983463756739,
"eval_stsb_spearman": 0.8456643319606,
"step": 13375
},
{
"epoch": 0.86,
"learning_rate": 3.976193523614489e-06,
"loss": 0.0002,
"step": 13500
},
{
"epoch": 0.86,
"eval_avg_sts": 0.7912515138401426,
"eval_sickr_spearman": 0.7371570411348254,
"eval_stsb_spearman": 0.8453459865454599,
"step": 13500
},
{
"epoch": 0.87,
"eval_avg_sts": 0.7912798783058242,
"eval_sickr_spearman": 0.7375416261640404,
"eval_stsb_spearman": 0.8450181304476081,
"step": 13625
},
{
"epoch": 0.88,
"eval_avg_sts": 0.7915843291718891,
"eval_sickr_spearman": 0.7376919154804402,
"eval_stsb_spearman": 0.845476742863338,
"step": 13750
},
{
"epoch": 0.89,
"eval_avg_sts": 0.7917255539871094,
"eval_sickr_spearman": 0.7381062797925467,
"eval_stsb_spearman": 0.8453448281816721,
"step": 13875
},
{
"epoch": 0.9,
"learning_rate": 3.864200691155766e-06,
"loss": 0.0001,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.7916416194141285,
"eval_sickr_spearman": 0.7380577683800943,
"eval_stsb_spearman": 0.8452254704481627,
"step": 14000
},
{
"epoch": 0.9,
"eval_avg_sts": 0.7924269371428458,
"eval_sickr_spearman": 0.738714977941072,
"eval_stsb_spearman": 0.8461388963446196,
"step": 14125
},
{
"epoch": 0.91,
"eval_avg_sts": 0.7923356777507629,
"eval_sickr_spearman": 0.7386597902055195,
"eval_stsb_spearman": 0.8460115652960062,
"step": 14250
},
{
"epoch": 0.92,
"eval_avg_sts": 0.7922805942330418,
"eval_sickr_spearman": 0.7387613759850612,
"eval_stsb_spearman": 0.8457998124810223,
"step": 14375
},
{
"epoch": 0.93,
"learning_rate": 3.7522078586970435e-06,
"loss": 0.0001,
"step": 14500
},
{
"epoch": 0.93,
"eval_avg_sts": 0.7934966210957259,
"eval_sickr_spearman": 0.7397510568301936,
"eval_stsb_spearman": 0.8472421853612582,
"step": 14500
},
{
"epoch": 0.94,
"eval_avg_sts": 0.7930449265696451,
"eval_sickr_spearman": 0.7393639741837038,
"eval_stsb_spearman": 0.8467258789555864,
"step": 14625
},
{
"epoch": 0.94,
"eval_avg_sts": 0.7924737714972381,
"eval_sickr_spearman": 0.7393996612920722,
"eval_stsb_spearman": 0.845547881702404,
"step": 14750
},
{
"epoch": 0.95,
"eval_avg_sts": 0.792308440851152,
"eval_sickr_spearman": 0.739175211955052,
"eval_stsb_spearman": 0.845441669747252,
"step": 14875
},
{
"epoch": 0.96,
"learning_rate": 3.6402150262383203e-06,
"loss": 0.0001,
"step": 15000
},
{
"epoch": 0.96,
"eval_avg_sts": 0.7932488441451628,
"eval_sickr_spearman": 0.7404715713828667,
"eval_stsb_spearman": 0.8460261169074589,
"step": 15000
},
{
"epoch": 0.97,
"eval_avg_sts": 0.7931158785146848,
"eval_sickr_spearman": 0.7406130710077032,
"eval_stsb_spearman": 0.8456186860216665,
"step": 15125
},
{
"epoch": 0.98,
"eval_avg_sts": 0.7945903311020877,
"eval_sickr_spearman": 0.7431428210893474,
"eval_stsb_spearman": 0.8460378411148278,
"step": 15250
},
{
"epoch": 0.98,
"eval_avg_sts": 0.7948596387785098,
"eval_sickr_spearman": 0.7440196288461001,
"eval_stsb_spearman": 0.8456996487109196,
"step": 15375
},
{
"epoch": 0.99,
"learning_rate": 3.5282221937795976e-06,
"loss": 0.0002,
"step": 15500
},
{
"epoch": 0.99,
"eval_avg_sts": 0.7948372805541641,
"eval_sickr_spearman": 0.744097679385937,
"eval_stsb_spearman": 0.8455768817223914,
"step": 15500
},
{
"epoch": 1.0,
"eval_avg_sts": 0.7937246352478757,
"eval_sickr_spearman": 0.7439027691763012,
"eval_stsb_spearman": 0.8435465013194503,
"step": 15625
},
{
"epoch": 1.01,
"eval_avg_sts": 0.7937099307469273,
"eval_sickr_spearman": 0.7440485435691657,
"eval_stsb_spearman": 0.8433713179246888,
"step": 15750
},
{
"epoch": 1.02,
"eval_avg_sts": 0.7935877720189825,
"eval_sickr_spearman": 0.7440728953375949,
"eval_stsb_spearman": 0.84310264870037,
"step": 15875
},
{
"epoch": 1.02,
"learning_rate": 3.4162293613208757e-06,
"loss": 0.0001,
"step": 16000
},
{
"epoch": 1.02,
"eval_avg_sts": 0.7935863758797379,
"eval_sickr_spearman": 0.744390621073608,
"eval_stsb_spearman": 0.8427821306858677,
"step": 16000
},
{
"epoch": 1.03,
"eval_avg_sts": 0.7937197747425322,
"eval_sickr_spearman": 0.7444404293257993,
"eval_stsb_spearman": 0.8429991201592651,
"step": 16125
},
{
"epoch": 1.04,
"eval_avg_sts": 0.7924446512199308,
"eval_sickr_spearman": 0.7440353830473717,
"eval_stsb_spearman": 0.8408539193924898,
"step": 16250
},
{
"epoch": 1.05,
"eval_avg_sts": 0.7905555822474897,
"eval_sickr_spearman": 0.7383070017654566,
"eval_stsb_spearman": 0.8428041627295226,
"step": 16375
},
{
"epoch": 1.06,
"learning_rate": 3.304236528862153e-06,
"loss": 0.0001,
"step": 16500
},
{
"epoch": 1.06,
"eval_avg_sts": 0.7899406430528368,
"eval_sickr_spearman": 0.737816219970962,
"eval_stsb_spearman": 0.8420650661347118,
"step": 16500
},
{
"epoch": 1.06,
"eval_avg_sts": 0.7921524290697161,
"eval_sickr_spearman": 0.7417105816755641,
"eval_stsb_spearman": 0.842594276463868,
"step": 16625
},
{
"epoch": 1.07,
"eval_avg_sts": 0.7909061020892134,
"eval_sickr_spearman": 0.7410022670226564,
"eval_stsb_spearman": 0.8408099371557706,
"step": 16750
},
{
"epoch": 1.08,
"eval_avg_sts": 0.7911860344103485,
"eval_sickr_spearman": 0.7404902554813262,
"eval_stsb_spearman": 0.841881813339371,
"step": 16875
},
{
"epoch": 1.09,
"learning_rate": 3.19224369640343e-06,
"loss": 0.0002,
"step": 17000
},
{
"epoch": 1.09,
"eval_avg_sts": 0.7912332320403954,
"eval_sickr_spearman": 0.7405556258103834,
"eval_stsb_spearman": 0.8419108382704075,
"step": 17000
},
{
"epoch": 1.1,
"eval_avg_sts": 0.791745368257589,
"eval_sickr_spearman": 0.7407413620796446,
"eval_stsb_spearman": 0.8427493744355335,
"step": 17125
},
{
"epoch": 1.1,
"eval_avg_sts": 0.7936116457907827,
"eval_sickr_spearman": 0.7417212926111849,
"eval_stsb_spearman": 0.8455019989703806,
"step": 17250
},
{
"epoch": 1.11,
"eval_avg_sts": 0.7936037695250758,
"eval_sickr_spearman": 0.7418167304097425,
"eval_stsb_spearman": 0.8453908086404092,
"step": 17375
},
{
"epoch": 1.12,
"learning_rate": 3.0802508639447074e-06,
"loss": 0.0002,
"step": 17500
},
{
"epoch": 1.12,
"eval_avg_sts": 0.792413452164604,
"eval_sickr_spearman": 0.7425937295377067,
"eval_stsb_spearman": 0.8422331747915013,
"step": 17500
},
{
"epoch": 1.13,
"eval_avg_sts": 0.7927184217670188,
"eval_sickr_spearman": 0.7428243748868126,
"eval_stsb_spearman": 0.8426124686472249,
"step": 17625
},
{
"epoch": 1.14,
"eval_avg_sts": 0.7926960182448954,
"eval_sickr_spearman": 0.742725526880053,
"eval_stsb_spearman": 0.842666509609738,
"step": 17750
},
{
"epoch": 1.14,
"eval_avg_sts": 0.7927521207425385,
"eval_sickr_spearman": 0.7428051144151359,
"eval_stsb_spearman": 0.8426991270699412,
"step": 17875
},
{
"epoch": 1.15,
"learning_rate": 2.9682580314859847e-06,
"loss": 0.0,
"step": 18000
},
{
"epoch": 1.15,
"eval_avg_sts": 0.7928433137943678,
"eval_sickr_spearman": 0.7426588116801555,
"eval_stsb_spearman": 0.8430278159085801,
"step": 18000
},
{
"epoch": 1.16,
"eval_avg_sts": 0.792833492411573,
"eval_sickr_spearman": 0.7426310977346257,
"eval_stsb_spearman": 0.8430358870885203,
"step": 18125
},
{
"epoch": 1.17,
"eval_avg_sts": 0.7928841848486375,
"eval_sickr_spearman": 0.742908285221025,
"eval_stsb_spearman": 0.84286008447625,
"step": 18250
},
{
"epoch": 1.18,
"eval_avg_sts": 0.7925150543842555,
"eval_sickr_spearman": 0.743895084200071,
"eval_stsb_spearman": 0.84113502456844,
"step": 18375
},
{
"epoch": 1.18,
"learning_rate": 2.8562651990272623e-06,
"loss": 0.0001,
"step": 18500
},
{
"epoch": 1.18,
"eval_avg_sts": 0.7919487675309846,
"eval_sickr_spearman": 0.7431525714029392,
"eval_stsb_spearman": 0.84074496365903,
"step": 18500
},
{
"epoch": 1.19,
"eval_avg_sts": 0.7919787220051326,
"eval_sickr_spearman": 0.7432353770218185,
"eval_stsb_spearman": 0.8407220669884469,
"step": 18625
},
{
"epoch": 1.2,
"eval_avg_sts": 0.7920516311468476,
"eval_sickr_spearman": 0.7433836010008565,
"eval_stsb_spearman": 0.8407196612928387,
"step": 18750
},
{
"epoch": 1.21,
"eval_avg_sts": 0.79208040900112,
"eval_sickr_spearman": 0.7434916709790923,
"eval_stsb_spearman": 0.8406691470231478,
"step": 18875
},
{
"epoch": 1.22,
"learning_rate": 2.7442723665685396e-06,
"loss": 0.0001,
"step": 19000
},
{
"epoch": 1.22,
"eval_avg_sts": 0.7915679899923007,
"eval_sickr_spearman": 0.7422913257230525,
"eval_stsb_spearman": 0.8408446542615489,
"step": 19000
},
{
"epoch": 1.22,
"eval_avg_sts": 0.7924488788916606,
"eval_sickr_spearman": 0.7431180370410052,
"eval_stsb_spearman": 0.8417797207423161,
"step": 19125
},
{
"epoch": 1.23,
"eval_avg_sts": 0.7925131080137356,
"eval_sickr_spearman": 0.7439811559338482,
"eval_stsb_spearman": 0.8410450600936231,
"step": 19250
},
{
"epoch": 1.24,
"eval_avg_sts": 0.7923092664958495,
"eval_sickr_spearman": 0.7438394641846057,
"eval_stsb_spearman": 0.8407790688070933,
"step": 19375
},
{
"epoch": 1.25,
"learning_rate": 2.632279534109817e-06,
"loss": 0.0002,
"step": 19500
},
{
"epoch": 1.25,
"eval_avg_sts": 0.7915084313605771,
"eval_sickr_spearman": 0.7429506966835948,
"eval_stsb_spearman": 0.8400661660375595,
"step": 19500
},
{
"epoch": 1.26,
"eval_avg_sts": 0.7914848286255316,
"eval_sickr_spearman": 0.7429546352339128,
"eval_stsb_spearman": 0.8400150220171504,
"step": 19625
},
{
"epoch": 1.26,
"eval_avg_sts": 0.7919444499131418,
"eval_sickr_spearman": 0.7435056960607123,
"eval_stsb_spearman": 0.8403832037655713,
"step": 19750
},
{
"epoch": 1.27,
"eval_avg_sts": 0.7918604283998938,
"eval_sickr_spearman": 0.7430511777478034,
"eval_stsb_spearman": 0.8406696790519842,
"step": 19875
},
{
"epoch": 1.28,
"learning_rate": 2.5202867016510945e-06,
"loss": 0.0001,
"step": 20000
},
{
"epoch": 1.28,
"eval_avg_sts": 0.7901084692338984,
"eval_sickr_spearman": 0.7411617302794309,
"eval_stsb_spearman": 0.839055208188366,
"step": 20000
},
{
"epoch": 1.29,
"eval_avg_sts": 0.789757862825201,
"eval_sickr_spearman": 0.7407969340640084,
"eval_stsb_spearman": 0.8387187915863936,
"step": 20125
},
{
"epoch": 1.3,
"eval_avg_sts": 0.7898529068915039,
"eval_sickr_spearman": 0.7409771947877056,
"eval_stsb_spearman": 0.8387286189953022,
"step": 20250
},
{
"epoch": 1.3,
"eval_avg_sts": 0.789768082574833,
"eval_sickr_spearman": 0.74083372588771,
"eval_stsb_spearman": 0.838702439261956,
"step": 20375
},
{
"epoch": 1.31,
"learning_rate": 2.4082938691923718e-06,
"loss": 0.0,
"step": 20500
},
{
"epoch": 1.31,
"eval_avg_sts": 0.7897954058339804,
"eval_sickr_spearman": 0.7408093260881794,
"eval_stsb_spearman": 0.8387814855797816,
"step": 20500
},
{
"epoch": 1.32,
"eval_avg_sts": 0.7899947832336973,
"eval_sickr_spearman": 0.7409338707342086,
"eval_stsb_spearman": 0.8390556957331861,
"step": 20625
},
{
"epoch": 1.33,
"eval_avg_sts": 0.790202509592782,
"eval_sickr_spearman": 0.7411228731183674,
"eval_stsb_spearman": 0.8392821460671965,
"step": 20750
},
{
"epoch": 1.34,
"eval_avg_sts": 0.7901906011266497,
"eval_sickr_spearman": 0.7410648995789316,
"eval_stsb_spearman": 0.839316302674368,
"step": 20875
},
{
"epoch": 1.34,
"learning_rate": 2.296301036733649e-06,
"loss": 0.0,
"step": 21000
},
{
"epoch": 1.34,
"eval_avg_sts": 0.7902077356957227,
"eval_sickr_spearman": 0.7411439107407973,
"eval_stsb_spearman": 0.839271560650648,
"step": 21000
},
{
"epoch": 1.35,
"eval_avg_sts": 0.7901431265829444,
"eval_sickr_spearman": 0.7410307494658092,
"eval_stsb_spearman": 0.8392555037000796,
"step": 21125
},
{
"epoch": 1.36,
"eval_avg_sts": 0.7921962350985728,
"eval_sickr_spearman": 0.7434804797324572,
"eval_stsb_spearman": 0.8409119904646885,
"step": 21250
},
{
"epoch": 1.37,
"eval_avg_sts": 0.7922085580785473,
"eval_sickr_spearman": 0.7434956095294102,
"eval_stsb_spearman": 0.8409215066276844,
"step": 21375
},
{
"epoch": 1.38,
"learning_rate": 2.1843082042749267e-06,
"loss": 0.0001,
"step": 21500
},
{
"epoch": 1.38,
"eval_avg_sts": 0.7922422656604595,
"eval_sickr_spearman": 0.7434714018542854,
"eval_stsb_spearman": 0.8410131294666336,
"step": 21500
},
{
"epoch": 1.38,
"eval_avg_sts": 0.7922953172658802,
"eval_sickr_spearman": 0.7435230833194328,
"eval_stsb_spearman": 0.8410675512123275,
"step": 21625
},
{
"epoch": 1.39,
"eval_avg_sts": 0.7920827130593174,
"eval_sickr_spearman": 0.7432143393993886,
"eval_stsb_spearman": 0.8409510867192462,
"step": 21750
},
{
"epoch": 1.4,
"eval_avg_sts": 0.7893982619162593,
"eval_sickr_spearman": 0.7409595673734778,
"eval_stsb_spearman": 0.8378369564590408,
"step": 21875
},
{
"epoch": 1.41,
"learning_rate": 2.072315371816204e-06,
"loss": 0.0002,
"step": 22000
},
{
"epoch": 1.41,
"eval_avg_sts": 0.7906089294600861,
"eval_sickr_spearman": 0.7422200475685182,
"eval_stsb_spearman": 0.838997811351654,
"step": 22000
},
{
"epoch": 1.42,
"eval_avg_sts": 0.7914097742253603,
"eval_sickr_spearman": 0.7423016043787602,
"eval_stsb_spearman": 0.8405179440719603,
"step": 22125
},
{
"epoch": 1.42,
"eval_avg_sts": 0.791727396078017,
"eval_sickr_spearman": 0.7433686633283093,
"eval_stsb_spearman": 0.8400861288277247,
"step": 22250
},
{
"epoch": 1.43,
"eval_avg_sts": 0.7914842385018235,
"eval_sickr_spearman": 0.7423251876495663,
"eval_stsb_spearman": 0.8406432893540806,
"step": 22375
},
{
"epoch": 1.44,
"learning_rate": 1.9603225393574807e-06,
"loss": 0.0001,
"step": 22500
},
{
"epoch": 1.44,
"eval_avg_sts": 0.7915202710875588,
"eval_sickr_spearman": 0.7422767242682152,
"eval_stsb_spearman": 0.8407638179069024,
"step": 22500
},
{
"epoch": 1.45,
"eval_avg_sts": 0.7918702583757414,
"eval_sickr_spearman": 0.7429271614438903,
"eval_stsb_spearman": 0.8408133553075926,
"step": 22625
},
{
"epoch": 1.46,
"eval_avg_sts": 0.7916045718347005,
"eval_sickr_spearman": 0.7425266300889978,
"eval_stsb_spearman": 0.840682513580403,
"step": 22750
},
{
"epoch": 1.46,
"eval_avg_sts": 0.7915999641875153,
"eval_sickr_spearman": 0.7422474733274393,
"eval_stsb_spearman": 0.8409524550475914,
"step": 22875
},
{
"epoch": 1.47,
"learning_rate": 1.8483297068987584e-06,
"loss": 0.0002,
"step": 23000
},
{
"epoch": 1.47,
"eval_avg_sts": 0.792815682844469,
"eval_sickr_spearman": 0.7426967562502915,
"eval_stsb_spearman": 0.8429346094386464,
"step": 23000
},
{
"epoch": 1.48,
"eval_avg_sts": 0.7927916857497739,
"eval_sickr_spearman": 0.7425698100491905,
"eval_stsb_spearman": 0.8430135614503571,
"step": 23125
},
{
"epoch": 1.49,
"eval_avg_sts": 0.7928345271530053,
"eval_sickr_spearman": 0.7425940177243154,
"eval_stsb_spearman": 0.8430750365816952,
"step": 23250
},
{
"epoch": 1.5,
"eval_avg_sts": 0.7930442205998951,
"eval_sickr_spearman": 0.7427970932211958,
"eval_stsb_spearman": 0.8432913479785945,
"step": 23375
},
{
"epoch": 1.5,
"learning_rate": 1.7363368744400357e-06,
"loss": 0.0,
"step": 23500
},
{
"epoch": 1.5,
"eval_avg_sts": 0.793033132084566,
"eval_sickr_spearman": 0.7428263441619716,
"eval_stsb_spearman": 0.8432399200071605,
"step": 23500
},
{
"epoch": 1.51,
"eval_avg_sts": 0.7929242651260953,
"eval_sickr_spearman": 0.7427599171486827,
"eval_stsb_spearman": 0.8430886131035079,
"step": 23625
},
{
"epoch": 1.52,
"eval_avg_sts": 0.7936208486615127,
"eval_sickr_spearman": 0.7430878254782006,
"eval_stsb_spearman": 0.8441538718448248,
"step": 23750
},
{
"epoch": 1.53,
"eval_avg_sts": 0.7935886289185006,
"eval_sickr_spearman": 0.7430728878056534,
"eval_stsb_spearman": 0.8441043700313476,
"step": 23875
},
{
"epoch": 1.54,
"learning_rate": 1.6243440419813131e-06,
"loss": 0.0001,
"step": 24000
},
{
"epoch": 1.54,
"eval_avg_sts": 0.7935571381985222,
"eval_sickr_spearman": 0.7430181323500139,
"eval_stsb_spearman": 0.8440961440470305,
"step": 24000
},
{
"epoch": 1.54,
"eval_avg_sts": 0.7935492855380204,
"eval_sickr_spearman": 0.7430870569805776,
"eval_stsb_spearman": 0.8440115140954632,
"step": 24125
},
{
"epoch": 1.55,
"eval_avg_sts": 0.7936128430055818,
"eval_sickr_spearman": 0.7431491611947371,
"eval_stsb_spearman": 0.8440765248164266,
"step": 24250
},
{
"epoch": 1.56,
"eval_avg_sts": 0.7936605492215507,
"eval_sickr_spearman": 0.7432605933500736,
"eval_stsb_spearman": 0.844060505093028,
"step": 24375
},
{
"epoch": 1.57,
"learning_rate": 1.5123512095225906e-06,
"loss": 0.0,
"step": 24500
},
{
"epoch": 1.57,
"eval_avg_sts": 0.793667841726459,
"eval_sickr_spearman": 0.7432775483288812,
"eval_stsb_spearman": 0.8440581351240368,
"step": 24500
},
{
"epoch": 1.58,
"eval_avg_sts": 0.7948942597846932,
"eval_sickr_spearman": 0.744056468700903,
"eval_stsb_spearman": 0.8457320508684834,
"step": 24625
},
{
"epoch": 1.58,
"eval_avg_sts": 0.7948721522573494,
"eval_sickr_spearman": 0.7440626647129885,
"eval_stsb_spearman": 0.8456816398017104,
"step": 24750
},
{
"epoch": 1.59,
"eval_avg_sts": 0.7945095949089607,
"eval_sickr_spearman": 0.7443504190417043,
"eval_stsb_spearman": 0.8446687707762169,
"step": 24875
},
{
"epoch": 1.6,
"learning_rate": 1.4003583770638678e-06,
"loss": 0.0001,
"step": 25000
},
{
"epoch": 1.6,
"eval_avg_sts": 0.7947724077574231,
"eval_sickr_spearman": 0.7446924004839437,
"eval_stsb_spearman": 0.8448524150309025,
"step": 25000
},
{
"epoch": 1.61,
"eval_avg_sts": 0.7959915253602992,
"eval_sickr_spearman": 0.7461332854959857,
"eval_stsb_spearman": 0.8458497652246126,
"step": 25125
},
{
"epoch": 1.62,
"eval_avg_sts": 0.7955281876289857,
"eval_sickr_spearman": 0.7458754244134463,
"eval_stsb_spearman": 0.845180950844525,
"step": 25250
},
{
"epoch": 1.62,
"eval_avg_sts": 0.79543745522762,
"eval_sickr_spearman": 0.7456630610129066,
"eval_stsb_spearman": 0.8452118494423333,
"step": 25375
},
{
"epoch": 1.63,
"learning_rate": 1.2883655446051453e-06,
"loss": 0.0001,
"step": 25500
},
{
"epoch": 1.63,
"eval_avg_sts": 0.795353488562289,
"eval_sickr_spearman": 0.7455269408714309,
"eval_stsb_spearman": 0.8451800362531473,
"step": 25500
},
{
"epoch": 1.64,
"eval_avg_sts": 0.7953584932327289,
"eval_sickr_spearman": 0.745271175256273,
"eval_stsb_spearman": 0.8454458112091847,
"step": 25625
},
{
"epoch": 1.65,
"eval_avg_sts": 0.7953254322370598,
"eval_sickr_spearman": 0.7452719917849974,
"eval_stsb_spearman": 0.8453788726891222,
"step": 25750
},
{
"epoch": 1.66,
"eval_avg_sts": 0.7952872018869009,
"eval_sickr_spearman": 0.7452931735007315,
"eval_stsb_spearman": 0.8452812302730703,
"step": 25875
},
{
"epoch": 1.66,
"learning_rate": 1.1763727121464225e-06,
"loss": 0.0001,
"step": 26000
},
{
"epoch": 1.66,
"eval_avg_sts": 0.7952607086010879,
"eval_sickr_spearman": 0.7453110410704665,
"eval_stsb_spearman": 0.8452103761317094,
"step": 26000
},
{
"epoch": 1.67,
"eval_avg_sts": 0.7950903508557705,
"eval_sickr_spearman": 0.7449656494200251,
"eval_stsb_spearman": 0.8452150522915161,
"step": 26125
},
{
"epoch": 1.68,
"eval_avg_sts": 0.7950105822340711,
"eval_sickr_spearman": 0.7448497023411534,
"eval_stsb_spearman": 0.8451714621269887,
"step": 26250
},
{
"epoch": 1.69,
"eval_avg_sts": 0.7950131323560599,
"eval_sickr_spearman": 0.744852055865124,
"eval_stsb_spearman": 0.8451742088469958,
"step": 26375
},
{
"epoch": 1.7,
"learning_rate": 1.0643798796877e-06,
"loss": 0.0001,
"step": 26500
},
{
"epoch": 1.7,
"eval_avg_sts": 0.7950484138603111,
"eval_sickr_spearman": 0.7455690161162907,
"eval_stsb_spearman": 0.8445278116043317,
"step": 26500
},
{
"epoch": 1.7,
"eval_avg_sts": 0.7950041615346236,
"eval_sickr_spearman": 0.7455438958502385,
"eval_stsb_spearman": 0.8444644272190087,
"step": 26625
},
{
"epoch": 1.71,
"eval_avg_sts": 0.7946972455858132,
"eval_sickr_spearman": 0.745472569664603,
"eval_stsb_spearman": 0.8439219215070236,
"step": 26750
},
{
"epoch": 1.72,
"eval_avg_sts": 0.7944591743219949,
"eval_sickr_spearman": 0.7454866427773243,
"eval_stsb_spearman": 0.8434317058666653,
"step": 26875
},
{
"epoch": 1.73,
"learning_rate": 9.523870472289774e-07,
"loss": 0.0001,
"step": 27000
},
{
"epoch": 1.73,
"eval_avg_sts": 0.7944066177099748,
"eval_sickr_spearman": 0.7454395722979149,
"eval_stsb_spearman": 0.8433736631220347,
"step": 27000
},
{
"epoch": 1.74,
"eval_avg_sts": 0.7944436945207991,
"eval_sickr_spearman": 0.7455328006658063,
"eval_stsb_spearman": 0.8433545883757919,
"step": 27125
},
{
"epoch": 1.74,
"eval_avg_sts": 0.7944797298738457,
"eval_sickr_spearman": 0.7455790065853898,
"eval_stsb_spearman": 0.8433804531623017,
"step": 27250
},
{
"epoch": 1.75,
"eval_avg_sts": 0.7944698737687554,
"eval_sickr_spearman": 0.7455735310398258,
"eval_stsb_spearman": 0.8433662164976851,
"step": 27375
},
{
"epoch": 1.76,
"learning_rate": 8.403942147702547e-07,
"loss": 0.0001,
"step": 27500
},
{
"epoch": 1.76,
"eval_avg_sts": 0.7942514496393891,
"eval_sickr_spearman": 0.74535724699005,
"eval_stsb_spearman": 0.8431456522887281,
"step": 27500
},
{
"epoch": 1.77,
"eval_avg_sts": 0.7944530448391101,
"eval_sickr_spearman": 0.7454611862935621,
"eval_stsb_spearman": 0.8434449033846582,
"step": 27625
},
{
"epoch": 1.78,
"eval_avg_sts": 0.7944670140899726,
"eval_sickr_spearman": 0.7455168063090274,
"eval_stsb_spearman": 0.8434172218709176,
"step": 27750
},
{
"epoch": 1.78,
"eval_avg_sts": 0.7944968856863333,
"eval_sickr_spearman": 0.7455487469914838,
"eval_stsb_spearman": 0.8434450243811827,
"step": 27875
},
{
"epoch": 1.79,
"learning_rate": 7.284013823115321e-07,
"loss": 0.0001,
"step": 28000
},
{
"epoch": 1.79,
"eval_avg_sts": 0.7944813522912897,
"eval_sickr_spearman": 0.7459449555472468,
"eval_stsb_spearman": 0.8430177490353326,
"step": 28000
},
{
"epoch": 1.8,
"eval_avg_sts": 0.7944717848510598,
"eval_sickr_spearman": 0.7458816025244499,
"eval_stsb_spearman": 0.8430619671776697,
"step": 28125
},
{
"epoch": 1.81,
"eval_avg_sts": 0.7943252967954475,
"eval_sickr_spearman": 0.7455355384385883,
"eval_stsb_spearman": 0.8431150551523066,
"step": 28250
},
{
"epoch": 1.82,
"eval_avg_sts": 0.7945802673668048,
"eval_sickr_spearman": 0.7459384233174512,
"eval_stsb_spearman": 0.8432221114161584,
"step": 28375
},
{
"epoch": 1.82,
"learning_rate": 6.164085498528094e-07,
"loss": 0.0001,
"step": 28500
},
{
"epoch": 1.82,
"eval_avg_sts": 0.7945695711998493,
"eval_sickr_spearman": 0.7459346288604376,
"eval_stsb_spearman": 0.843204513539261,
"step": 28500
},
{
"epoch": 1.83,
"eval_avg_sts": 0.7945396361578374,
"eval_sickr_spearman": 0.7462354956798459,
"eval_stsb_spearman": 0.8428437766358288,
"step": 28625
},
{
"epoch": 1.84,
"eval_avg_sts": 0.7944409539151067,
"eval_sickr_spearman": 0.7461240814315593,
"eval_stsb_spearman": 0.8427578263986542,
"step": 28750
},
{
"epoch": 1.85,
"eval_avg_sts": 0.7940565976087757,
"eval_sickr_spearman": 0.7457283833108623,
"eval_stsb_spearman": 0.8423848119066891,
"step": 28875
},
{
"epoch": 1.86,
"learning_rate": 5.044157173940868e-07,
"loss": 0.0002,
"step": 29000
},
{
"epoch": 1.86,
"eval_avg_sts": 0.7940545279108154,
"eval_sickr_spearman": 0.7457486524356691,
"eval_stsb_spearman": 0.8423604033859617,
"step": 29000
},
{
"epoch": 1.86,
"eval_avg_sts": 0.7940541798236898,
"eval_sickr_spearman": 0.7457327061099918,
"eval_stsb_spearman": 0.8423756535373876,
"step": 29125
},
{
"epoch": 1.87,
"eval_avg_sts": 0.794045870127827,
"eval_sickr_spearman": 0.7457254534136746,
"eval_stsb_spearman": 0.8423662868419793,
"step": 29250
},
{
"epoch": 1.88,
"eval_avg_sts": 0.7939439159521589,
"eval_sickr_spearman": 0.7456850112262637,
"eval_stsb_spearman": 0.8422028206780539,
"step": 29375
},
{
"epoch": 1.89,
"learning_rate": 3.9242288493536413e-07,
"loss": 0.0001,
"step": 29500
},
{
"epoch": 1.89,
"eval_avg_sts": 0.7938843170635432,
"eval_sickr_spearman": 0.7456857797238867,
"eval_stsb_spearman": 0.8420828544031996,
"step": 29500
},
{
"epoch": 1.9,
"eval_avg_sts": 0.7938335370035037,
"eval_sickr_spearman": 0.7456398619909119,
"eval_stsb_spearman": 0.8420272120160953,
"step": 29625
},
{
"epoch": 1.9,
"eval_avg_sts": 0.7937791099281831,
"eval_sickr_spearman": 0.7455667765481975,
"eval_stsb_spearman": 0.8419914433081688,
"step": 29750
},
{
"epoch": 1.91,
"eval_avg_sts": 0.7937599626397398,
"eval_sickr_spearman": 0.7455335691634293,
"eval_stsb_spearman": 0.8419863561160503,
"step": 29875
},
{
"epoch": 1.92,
"learning_rate": 2.804300524766415e-07,
"loss": 0.0001,
"step": 30000
},
{
"epoch": 1.92,
"eval_avg_sts": 0.7937406443684292,
"eval_sickr_spearman": 0.7454874593060488,
"eval_stsb_spearman": 0.8419938294308097,
"step": 30000
},
{
"epoch": 1.93,
"eval_avg_sts": 0.7939020781683644,
"eval_sickr_spearman": 0.7457190652771832,
"eval_stsb_spearman": 0.8420850910595457,
"step": 30125
},
{
"epoch": 1.94,
"eval_avg_sts": 0.7938812791358627,
"eval_sickr_spearman": 0.7456977394681448,
"eval_stsb_spearman": 0.8420648188035805,
"step": 30250
},
{
"epoch": 1.94,
"eval_avg_sts": 0.7937378630658074,
"eval_sickr_spearman": 0.7454741066598489,
"eval_stsb_spearman": 0.842001619471766,
"step": 30375
},
{
"epoch": 1.95,
"learning_rate": 1.6843722001791884e-07,
"loss": 0.0002,
"step": 30500
},
{
"epoch": 1.95,
"eval_avg_sts": 0.7937467005092009,
"eval_sickr_spearman": 0.7454940875980473,
"eval_stsb_spearman": 0.8419993134203545,
"step": 30500
},
{
"epoch": 1.96,
"eval_avg_sts": 0.7937544654414969,
"eval_sickr_spearman": 0.7454804467652388,
"eval_stsb_spearman": 0.8420284841177549,
"step": 30625
},
{
"epoch": 1.97,
"eval_avg_sts": 0.7937753802718709,
"eval_sickr_spearman": 0.7455158937181001,
"eval_stsb_spearman": 0.8420348668256417,
"step": 30750
},
{
"epoch": 1.98,
"eval_avg_sts": 0.7937608907538469,
"eval_sickr_spearman": 0.745488035679266,
"eval_stsb_spearman": 0.8420337458284277,
"step": 30875
},
{
"epoch": 1.98,
"learning_rate": 5.64443875591962e-08,
"loss": 0.0001,
"step": 31000
},
{
"epoch": 1.98,
"eval_avg_sts": 0.7937471629995045,
"eval_sickr_spearman": 0.7454658933415031,
"eval_stsb_spearman": 0.8420284326575058,
"step": 31000
},
{
"epoch": 1.99,
"eval_avg_sts": 0.7937690011247767,
"eval_sickr_spearman": 0.7455096977060146,
"eval_stsb_spearman": 0.8420283045435387,
"step": 31125
},
{
"epoch": 2.0,
"eval_avg_sts": 0.7937804647459197,
"eval_sickr_spearman": 0.7455530217595118,
"eval_stsb_spearman": 0.8420079077323277,
"step": 31250
},
{
"epoch": 2.0,
"step": 31252,
"train_runtime": 9641.8618,
"train_samples_per_second": 3.241
}
],
"max_steps": 31252,
"num_train_epochs": 2,
"total_flos": 333421219511531712,
"trial_name": null,
"trial_params": null
}