{ "best_metric": 0.8634219634166282, "best_model_checkpoint": "result/large-202201021402/unsup-119", "epoch": 1.0, "global_step": 15626, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "eval_avg_sts": 0.6173750067593105, "eval_sickr_spearman": 0.6012189855647659, "eval_stsb_spearman": 0.633531027953855, "step": 125 }, { "epoch": 0.02, "eval_avg_sts": 0.6628010365003804, "eval_sickr_spearman": 0.6482342292074627, "eval_stsb_spearman": 0.6773678437932981, "step": 250 }, { "epoch": 0.02, "eval_avg_sts": 0.7282832479999479, "eval_sickr_spearman": 0.7101949744669466, "eval_stsb_spearman": 0.7463715215329493, "step": 375 }, { "epoch": 0.03, "learning_rate": 9.680020478689364e-06, "loss": 1.4084, "step": 500 }, { "epoch": 0.03, "eval_avg_sts": 0.738101759870555, "eval_sickr_spearman": 0.7213240688567659, "eval_stsb_spearman": 0.7548794508843443, "step": 500 }, { "epoch": 0.04, "eval_avg_sts": 0.7653884278548279, "eval_sickr_spearman": 0.7448660809467439, "eval_stsb_spearman": 0.7859107747629118, "step": 625 }, { "epoch": 0.05, "eval_avg_sts": 0.7739443328792432, "eval_sickr_spearman": 0.7523560028739017, "eval_stsb_spearman": 0.7955326628845848, "step": 750 }, { "epoch": 0.06, "eval_avg_sts": 0.7774626304280415, "eval_sickr_spearman": 0.7556382081906752, "eval_stsb_spearman": 0.7992870526654079, "step": 875 }, { "epoch": 0.06, "learning_rate": 9.36004095737873e-06, "loss": 1.3838, "step": 1000 }, { "epoch": 0.06, "eval_avg_sts": 0.7818787381829664, "eval_sickr_spearman": 0.7586150317645051, "eval_stsb_spearman": 0.8051424446014276, "step": 1000 }, { "epoch": 0.07, "eval_avg_sts": 0.7875780428353734, "eval_sickr_spearman": 0.7643657955396903, "eval_stsb_spearman": 0.8107902901310564, "step": 1125 }, { "epoch": 0.08, "eval_avg_sts": 0.7962537269069103, "eval_sickr_spearman": 0.7713706513734246, "eval_stsb_spearman": 0.8211368024403959, "step": 1250 }, { "epoch": 0.09, "eval_avg_sts": 0.7979229698983594, "eval_sickr_spearman": 0.7717030746264779, "eval_stsb_spearman": 0.8241428651702408, "step": 1375 }, { "epoch": 0.1, "learning_rate": 9.040061436068092e-06, "loss": 1.3838, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7975552076492964, "eval_sickr_spearman": 0.7733297919699839, "eval_stsb_spearman": 0.8217806233286091, "step": 1500 }, { "epoch": 0.1, "eval_avg_sts": 0.7995244315661667, "eval_sickr_spearman": 0.7741879636593786, "eval_stsb_spearman": 0.8248608994729549, "step": 1625 }, { "epoch": 0.11, "eval_avg_sts": 0.8013845059958824, "eval_sickr_spearman": 0.7711456736942885, "eval_stsb_spearman": 0.8316233382974761, "step": 1750 }, { "epoch": 0.12, "eval_avg_sts": 0.8016675955064965, "eval_sickr_spearman": 0.7721122996107306, "eval_stsb_spearman": 0.8312228914022624, "step": 1875 }, { "epoch": 0.13, "learning_rate": 8.720081914757458e-06, "loss": 1.3834, "step": 2000 }, { "epoch": 0.13, "eval_avg_sts": 0.8089501146520826, "eval_sickr_spearman": 0.7714815551866453, "eval_stsb_spearman": 0.8464186741175197, "step": 2000 }, { "epoch": 0.14, "eval_avg_sts": 0.8070369744020635, "eval_sickr_spearman": 0.7729106725788348, "eval_stsb_spearman": 0.8411632762252921, "step": 2125 }, { "epoch": 0.14, "eval_avg_sts": 0.8088242480333958, "eval_sickr_spearman": 0.7714153202977622, "eval_stsb_spearman": 0.8462331757690296, "step": 2250 }, { "epoch": 0.15, "eval_avg_sts": 0.8099469364414773, "eval_sickr_spearman": 0.7725471251720497, "eval_stsb_spearman": 0.8473467477109048, "step": 2375 }, { "epoch": 0.16, "learning_rate": 8.400102393446819e-06, "loss": 1.3832, "step": 2500 }, { "epoch": 0.16, "eval_avg_sts": 0.8131048878389238, "eval_sickr_spearman": 0.7713064337908019, "eval_stsb_spearman": 0.8549033418870456, "step": 2500 }, { "epoch": 0.17, "eval_avg_sts": 0.8164488766748953, "eval_sickr_spearman": 0.7764046470218489, "eval_stsb_spearman": 0.8564931063279417, "step": 2625 }, { "epoch": 0.18, "eval_avg_sts": 0.8175873157593689, "eval_sickr_spearman": 0.7767230451932822, "eval_stsb_spearman": 0.8584515863254557, "step": 2750 }, { "epoch": 0.18, "eval_avg_sts": 0.8166403679630079, "eval_sickr_spearman": 0.7760516664573802, "eval_stsb_spearman": 0.8572290694686354, "step": 2875 }, { "epoch": 0.19, "learning_rate": 8.080122872136184e-06, "loss": 1.3833, "step": 3000 }, { "epoch": 0.19, "eval_avg_sts": 0.8157693460916737, "eval_sickr_spearman": 0.7743323451503016, "eval_stsb_spearman": 0.857206347033046, "step": 3000 }, { "epoch": 0.2, "eval_avg_sts": 0.8150392842710488, "eval_sickr_spearman": 0.7724294970046278, "eval_stsb_spearman": 0.8576490715374696, "step": 3125 }, { "epoch": 0.21, "eval_avg_sts": 0.8151962431424102, "eval_sickr_spearman": 0.7735117337822314, "eval_stsb_spearman": 0.8568807525025892, "step": 3250 }, { "epoch": 0.22, "eval_avg_sts": 0.8170086003442181, "eval_sickr_spearman": 0.7705952372718078, "eval_stsb_spearman": 0.8634219634166282, "step": 3375 }, { "epoch": 0.22, "learning_rate": 7.760143350825547e-06, "loss": 1.3834, "step": 3500 }, { "epoch": 0.22, "eval_avg_sts": 0.8154897129691365, "eval_sickr_spearman": 0.7761568545695297, "eval_stsb_spearman": 0.8548225713687434, "step": 3500 }, { "epoch": 0.23, "eval_avg_sts": 0.8196396828185117, "eval_sickr_spearman": 0.779249721284434, "eval_stsb_spearman": 0.8600296443525893, "step": 3625 }, { "epoch": 0.24, "eval_avg_sts": 0.8178347113315759, "eval_sickr_spearman": 0.7778026882914081, "eval_stsb_spearman": 0.8578667343717438, "step": 3750 }, { "epoch": 0.25, "eval_avg_sts": 0.8171697922813259, "eval_sickr_spearman": 0.7775901986986459, "eval_stsb_spearman": 0.8567493858640058, "step": 3875 }, { "epoch": 0.26, "learning_rate": 7.440163829514912e-06, "loss": 1.3833, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.8174402673423591, "eval_sickr_spearman": 0.7767179538965296, "eval_stsb_spearman": 0.8581625807881884, "step": 4000 }, { "epoch": 0.26, "eval_avg_sts": 0.8155577027909464, "eval_sickr_spearman": 0.7732734995190984, "eval_stsb_spearman": 0.8578419060627945, "step": 4125 }, { "epoch": 0.27, "eval_avg_sts": 0.8147469901498937, "eval_sickr_spearman": 0.771565513551959, "eval_stsb_spearman": 0.8579284667478284, "step": 4250 }, { "epoch": 0.28, "eval_avg_sts": 0.8132680914978344, "eval_sickr_spearman": 0.7705074364183789, "eval_stsb_spearman": 0.8560287465772899, "step": 4375 }, { "epoch": 0.29, "learning_rate": 7.120184308204276e-06, "loss": 1.3831, "step": 4500 }, { "epoch": 0.29, "eval_avg_sts": 0.8111781546061814, "eval_sickr_spearman": 0.767962124259869, "eval_stsb_spearman": 0.8543941849524939, "step": 4500 }, { "epoch": 0.3, "eval_avg_sts": 0.8067605181721469, "eval_sickr_spearman": 0.7667528452189616, "eval_stsb_spearman": 0.8467681911253321, "step": 4625 }, { "epoch": 0.3, "eval_avg_sts": 0.805061635624042, "eval_sickr_spearman": 0.7615015511281912, "eval_stsb_spearman": 0.8486217201198928, "step": 4750 }, { "epoch": 0.31, "eval_avg_sts": 0.8038471796528851, "eval_sickr_spearman": 0.7597667215147881, "eval_stsb_spearman": 0.8479276377909821, "step": 4875 }, { "epoch": 0.32, "learning_rate": 6.800204786893639e-06, "loss": 1.3832, "step": 5000 }, { "epoch": 0.32, "eval_avg_sts": 0.804331555739771, "eval_sickr_spearman": 0.7603548623518979, "eval_stsb_spearman": 0.8483082491276442, "step": 5000 }, { "epoch": 0.33, "eval_avg_sts": 0.8053511928015219, "eval_sickr_spearman": 0.7614074159088126, "eval_stsb_spearman": 0.8492949696942312, "step": 5125 }, { "epoch": 0.34, "eval_avg_sts": 0.7985432237233677, "eval_sickr_spearman": 0.7516314537087078, "eval_stsb_spearman": 0.8454549937380277, "step": 5250 }, { "epoch": 0.34, "eval_avg_sts": 0.800089668096919, "eval_sickr_spearman": 0.7562339379418122, "eval_stsb_spearman": 0.8439453982520256, "step": 5375 }, { "epoch": 0.35, "learning_rate": 6.480225265583003e-06, "loss": 1.3833, "step": 5500 }, { "epoch": 0.35, "eval_avg_sts": 0.7995108246181313, "eval_sickr_spearman": 0.7555560269761146, "eval_stsb_spearman": 0.843465622260148, "step": 5500 }, { "epoch": 0.36, "eval_avg_sts": 0.7946854334729495, "eval_sickr_spearman": 0.7501423454708219, "eval_stsb_spearman": 0.8392285214750771, "step": 5625 }, { "epoch": 0.37, "eval_avg_sts": 0.7938089772181914, "eval_sickr_spearman": 0.7494677486511236, "eval_stsb_spearman": 0.8381502057852592, "step": 5750 }, { "epoch": 0.38, "eval_avg_sts": 0.7994330810887486, "eval_sickr_spearman": 0.7598704148842054, "eval_stsb_spearman": 0.8389957472932917, "step": 5875 }, { "epoch": 0.38, "learning_rate": 6.1602457442723675e-06, "loss": 1.3831, "step": 6000 }, { "epoch": 0.38, "eval_avg_sts": 0.8006950402497293, "eval_sickr_spearman": 0.7590634501275313, "eval_stsb_spearman": 0.8423266303719271, "step": 6000 }, { "epoch": 0.39, "eval_avg_sts": 0.7981365664953497, "eval_sickr_spearman": 0.7573632932299265, "eval_stsb_spearman": 0.8389098397607728, "step": 6125 }, { "epoch": 0.4, "eval_avg_sts": 0.797260786393159, "eval_sickr_spearman": 0.7531412633513134, "eval_stsb_spearman": 0.8413803094350046, "step": 6250 }, { "epoch": 0.41, "eval_avg_sts": 0.8002525553253802, "eval_sickr_spearman": 0.7581138752520997, "eval_stsb_spearman": 0.8423912353986607, "step": 6375 }, { "epoch": 0.42, "learning_rate": 5.840266222961732e-06, "loss": 1.3833, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.8002113456211982, "eval_sickr_spearman": 0.7571126189115208, "eval_stsb_spearman": 0.8433100723308756, "step": 6500 }, { "epoch": 0.42, "eval_avg_sts": 0.7918930851566096, "eval_sickr_spearman": 0.7477064481613881, "eval_stsb_spearman": 0.8360797221518311, "step": 6625 }, { "epoch": 0.43, "eval_avg_sts": 0.7924510170045258, "eval_sickr_spearman": 0.7493739439100151, "eval_stsb_spearman": 0.8355280900990365, "step": 6750 }, { "epoch": 0.44, "eval_avg_sts": 0.7945927190512974, "eval_sickr_spearman": 0.7502740947820667, "eval_stsb_spearman": 0.8389113433205279, "step": 6875 }, { "epoch": 0.45, "learning_rate": 5.520286701651095e-06, "loss": 1.3831, "step": 7000 }, { "epoch": 0.45, "eval_avg_sts": 0.794468123371008, "eval_sickr_spearman": 0.7500643909931879, "eval_stsb_spearman": 0.8388718557488282, "step": 7000 }, { "epoch": 0.46, "eval_avg_sts": 0.7942224614102554, "eval_sickr_spearman": 0.7504599271135308, "eval_stsb_spearman": 0.83798499570698, "step": 7125 }, { "epoch": 0.46, "eval_avg_sts": 0.793212714758925, "eval_sickr_spearman": 0.7516163719428562, "eval_stsb_spearman": 0.8348090575749938, "step": 7250 }, { "epoch": 0.47, "eval_avg_sts": 0.791642468147763, "eval_sickr_spearman": 0.748681383458379, "eval_stsb_spearman": 0.834603552837147, "step": 7375 }, { "epoch": 0.48, "learning_rate": 5.200307180340458e-06, "loss": 1.3831, "step": 7500 }, { "epoch": 0.48, "eval_avg_sts": 0.792711907370149, "eval_sickr_spearman": 0.7461013928446307, "eval_stsb_spearman": 0.8393224218956672, "step": 7500 }, { "epoch": 0.49, "eval_avg_sts": 0.7925208114993505, "eval_sickr_spearman": 0.7451070049515575, "eval_stsb_spearman": 0.8399346180471436, "step": 7625 }, { "epoch": 0.5, "eval_avg_sts": 0.7926421702060152, "eval_sickr_spearman": 0.7462153706483433, "eval_stsb_spearman": 0.8390689697636872, "step": 7750 }, { "epoch": 0.5, "eval_avg_sts": 0.7919285173732868, "eval_sickr_spearman": 0.7432351368663114, "eval_stsb_spearman": 0.8406218978802623, "step": 7875 }, { "epoch": 0.51, "learning_rate": 4.8803276590298225e-06, "loss": 1.3832, "step": 8000 }, { "epoch": 0.51, "eval_avg_sts": 0.7903254153370375, "eval_sickr_spearman": 0.7435248604701861, "eval_stsb_spearman": 0.8371259702038889, "step": 8000 }, { "epoch": 0.52, "eval_avg_sts": 0.7961442221524222, "eval_sickr_spearman": 0.7458505264018194, "eval_stsb_spearman": 0.846437917903025, "step": 8125 }, { "epoch": 0.53, "eval_avg_sts": 0.7950454156593848, "eval_sickr_spearman": 0.7449886082865125, "eval_stsb_spearman": 0.8451022230322571, "step": 8250 }, { "epoch": 0.54, "eval_avg_sts": 0.792686108913305, "eval_sickr_spearman": 0.7417272484677632, "eval_stsb_spearman": 0.8436449693588469, "step": 8375 }, { "epoch": 0.54, "learning_rate": 4.560348137719187e-06, "loss": 1.3831, "step": 8500 }, { "epoch": 0.54, "eval_avg_sts": 0.790817425934377, "eval_sickr_spearman": 0.7411045732687196, "eval_stsb_spearman": 0.8405302786000344, "step": 8500 }, { "epoch": 0.55, "eval_avg_sts": 0.7901648543781281, "eval_sickr_spearman": 0.7389814064607493, "eval_stsb_spearman": 0.8413483022955068, "step": 8625 }, { "epoch": 0.56, "eval_avg_sts": 0.790240059757523, "eval_sickr_spearman": 0.7385863506514208, "eval_stsb_spearman": 0.8418937688636251, "step": 8750 }, { "epoch": 0.57, "eval_avg_sts": 0.7887051283167092, "eval_sickr_spearman": 0.7367630420097286, "eval_stsb_spearman": 0.8406472146236897, "step": 8875 }, { "epoch": 0.58, "learning_rate": 4.24036861640855e-06, "loss": 1.383, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7877125146130246, "eval_sickr_spearman": 0.7356615927915497, "eval_stsb_spearman": 0.8397634364344995, "step": 9000 }, { "epoch": 0.58, "eval_avg_sts": 0.7874836125360063, "eval_sickr_spearman": 0.7346168683041693, "eval_stsb_spearman": 0.8403503567678434, "step": 9125 }, { "epoch": 0.59, "eval_avg_sts": 0.7874954897759103, "eval_sickr_spearman": 0.7342269518226948, "eval_stsb_spearman": 0.8407640277291258, "step": 9250 }, { "epoch": 0.6, "eval_avg_sts": 0.784178959071547, "eval_sickr_spearman": 0.7294457438611393, "eval_stsb_spearman": 0.8389121742819547, "step": 9375 }, { "epoch": 0.61, "learning_rate": 3.920389095097914e-06, "loss": 1.3831, "step": 9500 }, { "epoch": 0.61, "eval_avg_sts": 0.7831583604230383, "eval_sickr_spearman": 0.7287413197274478, "eval_stsb_spearman": 0.8375754011186287, "step": 9500 }, { "epoch": 0.62, "eval_avg_sts": 0.7836660632246585, "eval_sickr_spearman": 0.7300298981168296, "eval_stsb_spearman": 0.8373022283324874, "step": 9625 }, { "epoch": 0.62, "eval_avg_sts": 0.7815441234971521, "eval_sickr_spearman": 0.7273786773796486, "eval_stsb_spearman": 0.8357095696146557, "step": 9750 }, { "epoch": 0.63, "eval_avg_sts": 0.7885847398548176, "eval_sickr_spearman": 0.7416071226830666, "eval_stsb_spearman": 0.8355623570265684, "step": 9875 }, { "epoch": 0.64, "learning_rate": 3.600409573787278e-06, "loss": 1.3833, "step": 10000 }, { "epoch": 0.64, "eval_avg_sts": 0.789407852748685, "eval_sickr_spearman": 0.7440142973938404, "eval_stsb_spearman": 0.8348014081035294, "step": 10000 }, { "epoch": 0.65, "eval_avg_sts": 0.7887440580577265, "eval_sickr_spearman": 0.7422862344262999, "eval_stsb_spearman": 0.8352018816891532, "step": 10125 }, { "epoch": 0.66, "eval_avg_sts": 0.7877943614348063, "eval_sickr_spearman": 0.7412599538818719, "eval_stsb_spearman": 0.8343287689877407, "step": 10250 }, { "epoch": 0.66, "eval_avg_sts": 0.7870675080484348, "eval_sickr_spearman": 0.7398324695471311, "eval_stsb_spearman": 0.8343025465497387, "step": 10375 }, { "epoch": 0.67, "learning_rate": 3.280430052476642e-06, "loss": 1.383, "step": 10500 }, { "epoch": 0.67, "eval_avg_sts": 0.7855316903809282, "eval_sickr_spearman": 0.7367247131907809, "eval_stsb_spearman": 0.8343386675710754, "step": 10500 }, { "epoch": 0.68, "eval_avg_sts": 0.7851246296450775, "eval_sickr_spearman": 0.736261645341816, "eval_stsb_spearman": 0.8339876139483389, "step": 10625 }, { "epoch": 0.69, "eval_avg_sts": 0.7841961737035235, "eval_sickr_spearman": 0.7354697085413046, "eval_stsb_spearman": 0.8329226388657422, "step": 10750 }, { "epoch": 0.7, "eval_avg_sts": 0.7838315084569085, "eval_sickr_spearman": 0.7345151864624249, "eval_stsb_spearman": 0.8331478304513922, "step": 10875 }, { "epoch": 0.7, "learning_rate": 2.960450531166006e-06, "loss": 1.3829, "step": 11000 }, { "epoch": 0.7, "eval_avg_sts": 0.783352664817645, "eval_sickr_spearman": 0.7336182536741696, "eval_stsb_spearman": 0.8330870759611203, "step": 11000 }, { "epoch": 0.71, "eval_avg_sts": 0.7841170693562891, "eval_sickr_spearman": 0.7346750819991124, "eval_stsb_spearman": 0.8335590567134659, "step": 11125 }, { "epoch": 0.72, "eval_avg_sts": 0.7839455311656613, "eval_sickr_spearman": 0.7335271867058429, "eval_stsb_spearman": 0.8343638756254798, "step": 11250 }, { "epoch": 0.73, "eval_avg_sts": 0.7858793093736349, "eval_sickr_spearman": 0.7367065094033358, "eval_stsb_spearman": 0.8350521093439339, "step": 11375 }, { "epoch": 0.74, "learning_rate": 2.640471009855369e-06, "loss": 1.383, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.785960141552553, "eval_sickr_spearman": 0.7368878748423662, "eval_stsb_spearman": 0.8350324082627398, "step": 11500 }, { "epoch": 0.74, "eval_avg_sts": 0.7827362717943076, "eval_sickr_spearman": 0.7345604317599795, "eval_stsb_spearman": 0.8309121118286357, "step": 11625 }, { "epoch": 0.75, "eval_avg_sts": 0.782151314040066, "eval_sickr_spearman": 0.7333196443165289, "eval_stsb_spearman": 0.8309829837636032, "step": 11750 }, { "epoch": 0.76, "eval_avg_sts": 0.7814914570298286, "eval_sickr_spearman": 0.7326789574544458, "eval_stsb_spearman": 0.8303039566052115, "step": 11875 }, { "epoch": 0.77, "learning_rate": 2.3204914885447333e-06, "loss": 1.3831, "step": 12000 }, { "epoch": 0.77, "eval_avg_sts": 0.7813092418170919, "eval_sickr_spearman": 0.7323319807776568, "eval_stsb_spearman": 0.830286502856527, "step": 12000 }, { "epoch": 0.78, "eval_avg_sts": 0.7801988249710072, "eval_sickr_spearman": 0.7320945630432483, "eval_stsb_spearman": 0.8283030868987663, "step": 12125 }, { "epoch": 0.78, "eval_avg_sts": 0.781174501892351, "eval_sickr_spearman": 0.7298683695226933, "eval_stsb_spearman": 0.8324806342620087, "step": 12250 }, { "epoch": 0.79, "eval_avg_sts": 0.7816701818675454, "eval_sickr_spearman": 0.7288407921385262, "eval_stsb_spearman": 0.8344995715965647, "step": 12375 }, { "epoch": 0.8, "learning_rate": 2.000511967234097e-06, "loss": 1.383, "step": 12500 }, { "epoch": 0.8, "eval_avg_sts": 0.7812274276555035, "eval_sickr_spearman": 0.7285719140326756, "eval_stsb_spearman": 0.8338829412783313, "step": 12500 }, { "epoch": 0.81, "eval_avg_sts": 0.7811766812929849, "eval_sickr_spearman": 0.728695834274386, "eval_stsb_spearman": 0.8336575283115838, "step": 12625 }, { "epoch": 0.82, "eval_avg_sts": 0.7811575997131124, "eval_sickr_spearman": 0.7288844524097335, "eval_stsb_spearman": 0.8334307470164913, "step": 12750 }, { "epoch": 0.82, "eval_avg_sts": 0.7808650964963647, "eval_sickr_spearman": 0.7288432417246996, "eval_stsb_spearman": 0.8328869512680298, "step": 12875 }, { "epoch": 0.83, "learning_rate": 1.6805324459234608e-06, "loss": 1.3829, "step": 13000 }, { "epoch": 0.83, "eval_avg_sts": 0.7803803908797147, "eval_sickr_spearman": 0.7284006351249473, "eval_stsb_spearman": 0.832360146634482, "step": 13000 }, { "epoch": 0.84, "eval_avg_sts": 0.7805076637365365, "eval_sickr_spearman": 0.7283448710161777, "eval_stsb_spearman": 0.8326704564568952, "step": 13125 }, { "epoch": 0.85, "eval_avg_sts": 0.7805681692685815, "eval_sickr_spearman": 0.7283289246905003, "eval_stsb_spearman": 0.8328074138466628, "step": 13250 }, { "epoch": 0.86, "eval_avg_sts": 0.7804400499004719, "eval_sickr_spearman": 0.7275362193923656, "eval_stsb_spearman": 0.8333438804085782, "step": 13375 }, { "epoch": 0.86, "learning_rate": 1.3605529246128248e-06, "loss": 1.383, "step": 13500 }, { "epoch": 0.86, "eval_avg_sts": 0.7797914718222148, "eval_sickr_spearman": 0.727398562255644, "eval_stsb_spearman": 0.8321843813887856, "step": 13500 }, { "epoch": 0.87, "eval_avg_sts": 0.7783159916436958, "eval_sickr_spearman": 0.7271253547861919, "eval_stsb_spearman": 0.8295066285011997, "step": 13625 }, { "epoch": 0.88, "eval_avg_sts": 0.7787465759811611, "eval_sickr_spearman": 0.7272892434687709, "eval_stsb_spearman": 0.8302039084935513, "step": 13750 }, { "epoch": 0.89, "eval_avg_sts": 0.7785133054722726, "eval_sickr_spearman": 0.7278318027906158, "eval_stsb_spearman": 0.8291948081539294, "step": 13875 }, { "epoch": 0.9, "learning_rate": 1.0405734033021888e-06, "loss": 1.383, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.7785313836357052, "eval_sickr_spearman": 0.7276787276703326, "eval_stsb_spearman": 0.8293840396010778, "step": 14000 }, { "epoch": 0.9, "eval_avg_sts": 0.7781951381943462, "eval_sickr_spearman": 0.7266623415328006, "eval_stsb_spearman": 0.8297279348558916, "step": 14125 }, { "epoch": 0.91, "eval_avg_sts": 0.7782565319241563, "eval_sickr_spearman": 0.7269010080758466, "eval_stsb_spearman": 0.8296120557724662, "step": 14250 }, { "epoch": 0.92, "eval_avg_sts": 0.778284639461994, "eval_sickr_spearman": 0.7268794421113008, "eval_stsb_spearman": 0.8296898368126872, "step": 14375 }, { "epoch": 0.93, "learning_rate": 7.205938819915525e-07, "loss": 1.3831, "step": 14500 }, { "epoch": 0.93, "eval_avg_sts": 0.7782895613239478, "eval_sickr_spearman": 0.7268127269114034, "eval_stsb_spearman": 0.8297663957364921, "step": 14500 }, { "epoch": 0.94, "eval_avg_sts": 0.7789978370464021, "eval_sickr_spearman": 0.7271919804883588, "eval_stsb_spearman": 0.8308036936044454, "step": 14625 }, { "epoch": 0.94, "eval_avg_sts": 0.7790931167137354, "eval_sickr_spearman": 0.7273074952873174, "eval_stsb_spearman": 0.8308787381401533, "step": 14750 }, { "epoch": 0.95, "eval_avg_sts": 0.779219715499812, "eval_sickr_spearman": 0.7275282942606284, "eval_stsb_spearman": 0.8309111367389955, "step": 14875 }, { "epoch": 0.96, "learning_rate": 4.0061436068091647e-07, "loss": 1.383, "step": 15000 }, { "epoch": 0.96, "eval_avg_sts": 0.7791063980264322, "eval_sickr_spearman": 0.7273648924535359, "eval_stsb_spearman": 0.8308479035993286, "step": 15000 }, { "epoch": 0.97, "eval_avg_sts": 0.7790852665632677, "eval_sickr_spearman": 0.7270619122656642, "eval_stsb_spearman": 0.8311086208608711, "step": 15125 }, { "epoch": 0.98, "eval_avg_sts": 0.7791667180857071, "eval_sickr_spearman": 0.727271616054543, "eval_stsb_spearman": 0.8310618201168714, "step": 15250 }, { "epoch": 0.98, "eval_avg_sts": 0.7791280335279434, "eval_sickr_spearman": 0.7271601838992067, "eval_stsb_spearman": 0.83109588315668, "step": 15375 }, { "epoch": 0.99, "learning_rate": 8.06348393702803e-08, "loss": 1.383, "step": 15500 }, { "epoch": 0.99, "eval_avg_sts": 0.7791498757767996, "eval_sickr_spearman": 0.7272329990489868, "eval_stsb_spearman": 0.8310667525046124, "step": 15500 }, { "epoch": 1.0, "eval_avg_sts": 0.7791357795668019, "eval_sickr_spearman": 0.7272119133954554, "eval_stsb_spearman": 0.8310596457381484, "step": 15625 }, { "epoch": 1.0, "step": 15626, "train_runtime": 12960.19, "train_samples_per_second": 1.206 } ], "max_steps": 15626, "num_train_epochs": 1, "total_flos": 321736534216212480, "trial_name": null, "trial_params": null }