{ "best_metric": 0.6788413098236775, "best_model_checkpoint": "trained_models/wnut_17/checkpoint-9000", "epoch": 21.176470588235293, "global_step": 9000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.24, "eval_accuracy_score": 0.9205491641772071, "eval_f1": 0.0, "eval_loss": 0.5049907565116882, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 6.761, "eval_samples_per_second": 149.239, "eval_steps_per_second": 18.784, "step": 100 }, { "epoch": 0.47, "eval_accuracy_score": 0.9205491641772071, "eval_f1": 0.0, "eval_loss": 0.48477333784103394, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 6.7798, "eval_samples_per_second": 148.825, "eval_steps_per_second": 18.732, "step": 200 }, { "epoch": 0.71, "eval_accuracy_score": 0.9205491641772071, "eval_f1": 0.0, "eval_loss": 0.3834511935710907, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 6.7494, "eval_samples_per_second": 149.494, "eval_steps_per_second": 18.816, "step": 300 }, { "epoch": 0.94, "eval_accuracy_score": 0.9218203775503718, "eval_f1": 0.016241299303944315, "eval_loss": 0.3428375720977783, "eval_precision": 0.2692307692307692, "eval_recall": 0.008373205741626795, "eval_runtime": 6.7397, "eval_samples_per_second": 149.711, "eval_steps_per_second": 18.844, "step": 400 }, { "epoch": 1.18, "learning_rate": 4.803921568627452e-06, "loss": 0.4388, "step": 500 }, { "epoch": 1.18, "eval_accuracy_score": 0.9387275154134621, "eval_f1": 0.3550877192982456, "eval_loss": 0.31836700439453125, "eval_precision": 0.4295415959252971, "eval_recall": 0.3026315789473684, "eval_runtime": 6.749, "eval_samples_per_second": 149.504, "eval_steps_per_second": 18.818, "step": 500 }, { "epoch": 1.41, "eval_accuracy_score": 0.9413335028284497, "eval_f1": 0.40223463687150846, "eval_loss": 0.3077085316181183, "eval_precision": 0.48322147651006714, "eval_recall": 0.3444976076555024, "eval_runtime": 7.2416, "eval_samples_per_second": 139.333, "eval_steps_per_second": 17.537, "step": 600 }, { "epoch": 1.65, "eval_accuracy_score": 0.9449564609419691, "eval_f1": 0.46935933147632314, "eval_loss": 0.29629671573638916, "eval_precision": 0.5616666666666666, "eval_recall": 0.40311004784689, "eval_runtime": 6.7314, "eval_samples_per_second": 149.895, "eval_steps_per_second": 18.867, "step": 700 }, { "epoch": 1.88, "eval_accuracy_score": 0.9471810843450074, "eval_f1": 0.5139186295503213, "eval_loss": 0.2875679135322571, "eval_precision": 0.6371681415929203, "eval_recall": 0.430622009569378, "eval_runtime": 6.7537, "eval_samples_per_second": 149.401, "eval_steps_per_second": 18.805, "step": 800 }, { "epoch": 2.12, "eval_accuracy_score": 0.949278586410729, "eval_f1": 0.5329849771391247, "eval_loss": 0.27145618200302124, "eval_precision": 0.5870503597122302, "eval_recall": 0.4880382775119617, "eval_runtime": 6.7363, "eval_samples_per_second": 149.786, "eval_steps_per_second": 18.853, "step": 900 }, { "epoch": 2.35, "learning_rate": 4.607843137254902e-06, "loss": 0.1974, "step": 1000 }, { "epoch": 2.35, "eval_accuracy_score": 0.9492150257420708, "eval_f1": 0.5209424083769634, "eval_loss": 0.2602783441543579, "eval_precision": 0.5751445086705202, "eval_recall": 0.47607655502392343, "eval_runtime": 6.736, "eval_samples_per_second": 149.792, "eval_steps_per_second": 18.854, "step": 1000 }, { "epoch": 2.59, "eval_accuracy_score": 0.9504862391152354, "eval_f1": 0.5558510638297872, "eval_loss": 0.24513839185237885, "eval_precision": 0.625748502994012, "eval_recall": 0.5, "eval_runtime": 7.332, "eval_samples_per_second": 137.616, "eval_steps_per_second": 17.321, "step": 1100 }, { "epoch": 2.82, "eval_accuracy_score": 0.9520116951630331, "eval_f1": 0.5626566416040101, "eval_loss": 0.23386946320533752, "eval_precision": 0.5907894736842105, "eval_recall": 0.5370813397129187, "eval_runtime": 6.737, "eval_samples_per_second": 149.771, "eval_steps_per_second": 18.851, "step": 1200 }, { "epoch": 3.06, "eval_accuracy_score": 0.9529651051929067, "eval_f1": 0.5635782747603835, "eval_loss": 0.23247480392456055, "eval_precision": 0.6049382716049383, "eval_recall": 0.527511961722488, "eval_runtime": 6.7326, "eval_samples_per_second": 149.868, "eval_steps_per_second": 18.864, "step": 1300 }, { "epoch": 3.29, "eval_accuracy_score": 0.9557617746138689, "eval_f1": 0.5892526250772081, "eval_loss": 0.2185893952846527, "eval_precision": 0.6091954022988506, "eval_recall": 0.5705741626794258, "eval_runtime": 6.7427, "eval_samples_per_second": 149.643, "eval_steps_per_second": 18.835, "step": 1400 }, { "epoch": 3.53, "learning_rate": 4.411764705882353e-06, "loss": 0.1395, "step": 1500 }, { "epoch": 3.53, "eval_accuracy_score": 0.9572236699930083, "eval_f1": 0.6000000000000001, "eval_loss": 0.2226746827363968, "eval_precision": 0.6464088397790055, "eval_recall": 0.5598086124401914, "eval_runtime": 6.7181, "eval_samples_per_second": 150.191, "eval_steps_per_second": 18.904, "step": 1500 }, { "epoch": 3.76, "eval_accuracy_score": 0.9590033687154389, "eval_f1": 0.598405885959534, "eval_loss": 0.21203213930130005, "eval_precision": 0.6138364779874214, "eval_recall": 0.583732057416268, "eval_runtime": 6.7595, "eval_samples_per_second": 149.27, "eval_steps_per_second": 18.788, "step": 1600 }, { "epoch": 4.0, "eval_accuracy_score": 0.9586855653721477, "eval_f1": 0.618421052631579, "eval_loss": 0.22468985617160797, "eval_precision": 0.6871345029239766, "eval_recall": 0.562200956937799, "eval_runtime": 6.7215, "eval_samples_per_second": 150.115, "eval_steps_per_second": 18.895, "step": 1700 }, { "epoch": 4.24, "eval_accuracy_score": 0.9599567787453124, "eval_f1": 0.6330749354005167, "eval_loss": 0.2214759886264801, "eval_precision": 0.6882022471910112, "eval_recall": 0.5861244019138756, "eval_runtime": 6.7281, "eval_samples_per_second": 149.969, "eval_steps_per_second": 18.876, "step": 1800 }, { "epoch": 4.47, "eval_accuracy_score": 0.96148223479311, "eval_f1": 0.6507115135834413, "eval_loss": 0.21751971542835236, "eval_precision": 0.7084507042253522, "eval_recall": 0.6016746411483254, "eval_runtime": 6.7505, "eval_samples_per_second": 149.471, "eval_steps_per_second": 18.813, "step": 1900 }, { "epoch": 4.71, "learning_rate": 4.215686274509805e-06, "loss": 0.1057, "step": 2000 }, { "epoch": 4.71, "eval_accuracy_score": 0.9605923854318947, "eval_f1": 0.6401062416998671, "eval_loss": 0.22828274965286255, "eval_precision": 0.7194029850746269, "eval_recall": 0.5765550239234449, "eval_runtime": 6.7552, "eval_samples_per_second": 149.366, "eval_steps_per_second": 18.8, "step": 2000 }, { "epoch": 4.94, "eval_accuracy_score": 0.9621814021483506, "eval_f1": 0.6484424666242848, "eval_loss": 0.2120533287525177, "eval_precision": 0.6919945725915875, "eval_recall": 0.6100478468899522, "eval_runtime": 6.7607, "eval_samples_per_second": 149.245, "eval_steps_per_second": 18.785, "step": 2100 }, { "epoch": 5.18, "eval_accuracy_score": 0.9617364774677429, "eval_f1": 0.6427196921103272, "eval_loss": 0.21272720396518707, "eval_precision": 0.6929460580912863, "eval_recall": 0.5992822966507177, "eval_runtime": 6.823, "eval_samples_per_second": 147.882, "eval_steps_per_second": 18.613, "step": 2200 }, { "epoch": 5.41, "eval_accuracy_score": 0.9614186741244518, "eval_f1": 0.6440460947503202, "eval_loss": 0.21506403386592865, "eval_precision": 0.6928374655647382, "eval_recall": 0.6016746411483254, "eval_runtime": 6.7509, "eval_samples_per_second": 149.462, "eval_steps_per_second": 18.812, "step": 2300 }, { "epoch": 5.65, "eval_accuracy_score": 0.9625627661603, "eval_f1": 0.6498740554156172, "eval_loss": 0.20958468317985535, "eval_precision": 0.6861702127659575, "eval_recall": 0.6172248803827751, "eval_runtime": 6.7421, "eval_samples_per_second": 149.656, "eval_steps_per_second": 18.837, "step": 2400 }, { "epoch": 5.88, "learning_rate": 4.019607843137255e-06, "loss": 0.0811, "step": 2500 }, { "epoch": 5.88, "eval_accuracy_score": 0.9624356448229835, "eval_f1": 0.6591337099811676, "eval_loss": 0.2008962631225586, "eval_precision": 0.6935270805812418, "eval_recall": 0.6279904306220095, "eval_runtime": 6.7089, "eval_samples_per_second": 150.397, "eval_steps_per_second": 18.93, "step": 2500 }, { "epoch": 6.12, "eval_accuracy_score": 0.9621178414796924, "eval_f1": 0.6448717948717948, "eval_loss": 0.21091684699058533, "eval_precision": 0.6947513812154696, "eval_recall": 0.6016746411483254, "eval_runtime": 6.7609, "eval_samples_per_second": 149.241, "eval_steps_per_second": 18.785, "step": 2600 }, { "epoch": 6.35, "eval_accuracy_score": 0.9621178414796924, "eval_f1": 0.6499057196731616, "eval_loss": 0.21349507570266724, "eval_precision": 0.6847682119205298, "eval_recall": 0.618421052631579, "eval_runtime": 6.7376, "eval_samples_per_second": 149.757, "eval_steps_per_second": 18.849, "step": 2700 }, { "epoch": 6.59, "eval_accuracy_score": 0.9620542808110342, "eval_f1": 0.6467218332272437, "eval_loss": 0.2102096974849701, "eval_precision": 0.691156462585034, "eval_recall": 0.6076555023923444, "eval_runtime": 6.7394, "eval_samples_per_second": 149.717, "eval_steps_per_second": 18.844, "step": 2800 }, { "epoch": 6.82, "eval_accuracy_score": 0.9630076908409076, "eval_f1": 0.6658385093167701, "eval_loss": 0.2015107125043869, "eval_precision": 0.6925064599483204, "eval_recall": 0.6411483253588517, "eval_runtime": 6.7773, "eval_samples_per_second": 148.879, "eval_steps_per_second": 18.739, "step": 2900 }, { "epoch": 7.06, "learning_rate": 3.8235294117647055e-06, "loss": 0.0674, "step": 3000 }, { "epoch": 7.06, "eval_accuracy_score": 0.96364329752749, "eval_f1": 0.6624921728240452, "eval_loss": 0.20179474353790283, "eval_precision": 0.695137976346912, "eval_recall": 0.6327751196172249, "eval_runtime": 6.8013, "eval_samples_per_second": 148.354, "eval_steps_per_second": 18.673, "step": 3000 }, { "epoch": 7.29, "eval_accuracy_score": 0.9629441301722494, "eval_f1": 0.6454431960049937, "eval_loss": 0.20865464210510254, "eval_precision": 0.674934725848564, "eval_recall": 0.618421052631579, "eval_runtime": 6.7901, "eval_samples_per_second": 148.599, "eval_steps_per_second": 18.704, "step": 3100 }, { "epoch": 7.53, "eval_accuracy_score": 0.9631983728468824, "eval_f1": 0.6507237256135934, "eval_loss": 0.2077988088130951, "eval_precision": 0.6865869853917662, "eval_recall": 0.618421052631579, "eval_runtime": 6.7566, "eval_samples_per_second": 149.335, "eval_steps_per_second": 18.796, "step": 3200 }, { "epoch": 7.76, "eval_accuracy_score": 0.9626898874976165, "eval_f1": 0.6499678869621066, "eval_loss": 0.2155311405658722, "eval_precision": 0.7018030513176144, "eval_recall": 0.6052631578947368, "eval_runtime": 6.7572, "eval_samples_per_second": 149.321, "eval_steps_per_second": 18.795, "step": 3300 }, { "epoch": 8.0, "eval_accuracy_score": 0.9624356448229835, "eval_f1": 0.6524271844660194, "eval_loss": 0.21822784841060638, "eval_precision": 0.7108603667136812, "eval_recall": 0.6028708133971292, "eval_runtime": 6.7807, "eval_samples_per_second": 148.804, "eval_steps_per_second": 18.73, "step": 3400 }, { "epoch": 8.24, "learning_rate": 3.6274509803921573e-06, "loss": 0.0559, "step": 3500 }, { "epoch": 8.24, "eval_accuracy_score": 0.9631348121782242, "eval_f1": 0.659062103929024, "eval_loss": 0.21273677051067352, "eval_precision": 0.7008086253369272, "eval_recall": 0.6220095693779905, "eval_runtime": 6.7444, "eval_samples_per_second": 149.606, "eval_steps_per_second": 18.831, "step": 3500 }, { "epoch": 8.47, "eval_accuracy_score": 0.9634526155215153, "eval_f1": 0.6608478802992518, "eval_loss": 0.20193149149417877, "eval_precision": 0.6901041666666666, "eval_recall": 0.6339712918660287, "eval_runtime": 8.1777, "eval_samples_per_second": 123.384, "eval_steps_per_second": 15.53, "step": 3600 }, { "epoch": 8.71, "eval_accuracy_score": 0.9634526155215153, "eval_f1": 0.6587942821628341, "eval_loss": 0.20160645246505737, "eval_precision": 0.685640362225097, "eval_recall": 0.6339712918660287, "eval_runtime": 6.7668, "eval_samples_per_second": 149.11, "eval_steps_per_second": 18.768, "step": 3700 }, { "epoch": 8.94, "eval_accuracy_score": 0.9634526155215153, "eval_f1": 0.662553979025293, "eval_loss": 0.20665320754051208, "eval_precision": 0.6840764331210191, "eval_recall": 0.6423444976076556, "eval_runtime": 6.7328, "eval_samples_per_second": 149.863, "eval_steps_per_second": 18.863, "step": 3800 }, { "epoch": 9.18, "eval_accuracy_score": 0.9629441301722494, "eval_f1": 0.6566775244299674, "eval_loss": 0.22287048399448395, "eval_precision": 0.721030042918455, "eval_recall": 0.6028708133971292, "eval_runtime": 6.7851, "eval_samples_per_second": 148.709, "eval_steps_per_second": 18.718, "step": 3900 }, { "epoch": 9.41, "learning_rate": 3.431372549019608e-06, "loss": 0.0459, "step": 4000 }, { "epoch": 9.41, "eval_accuracy_score": 0.9635797368588318, "eval_f1": 0.6574827802128992, "eval_loss": 0.20987075567245483, "eval_precision": 0.6898817345597897, "eval_recall": 0.6279904306220095, "eval_runtime": 6.7469, "eval_samples_per_second": 149.549, "eval_steps_per_second": 18.823, "step": 4000 }, { "epoch": 9.65, "eval_accuracy_score": 0.9628805695035911, "eval_f1": 0.6568690095846645, "eval_loss": 0.22190582752227783, "eval_precision": 0.7050754458161865, "eval_recall": 0.6148325358851675, "eval_runtime": 6.7586, "eval_samples_per_second": 149.292, "eval_steps_per_second": 18.791, "step": 4100 }, { "epoch": 9.88, "eval_accuracy_score": 0.9632619335155406, "eval_f1": 0.6525265127885215, "eval_loss": 0.21028834581375122, "eval_precision": 0.681877444589309, "eval_recall": 0.6255980861244019, "eval_runtime": 6.7583, "eval_samples_per_second": 149.298, "eval_steps_per_second": 18.792, "step": 4200 }, { "epoch": 10.12, "eval_accuracy_score": 0.9640882222080976, "eval_f1": 0.6692111959287532, "eval_loss": 0.2170829027891159, "eval_precision": 0.7146739130434783, "eval_recall": 0.6291866028708134, "eval_runtime": 6.7544, "eval_samples_per_second": 149.383, "eval_steps_per_second": 18.802, "step": 4300 }, { "epoch": 10.35, "eval_accuracy_score": 0.9630712515095659, "eval_f1": 0.6495619524405507, "eval_loss": 0.2193835973739624, "eval_precision": 0.6811023622047244, "eval_recall": 0.6208133971291866, "eval_runtime": 6.7362, "eval_samples_per_second": 149.787, "eval_steps_per_second": 18.853, "step": 4400 }, { "epoch": 10.59, "learning_rate": 3.2352941176470594e-06, "loss": 0.0399, "step": 4500 }, { "epoch": 10.59, "eval_accuracy_score": 0.9634526155215153, "eval_f1": 0.6556543837357053, "eval_loss": 0.21863853931427002, "eval_precision": 0.6991869918699187, "eval_recall": 0.6172248803827751, "eval_runtime": 6.769, "eval_samples_per_second": 149.062, "eval_steps_per_second": 18.762, "step": 4500 }, { "epoch": 10.82, "eval_accuracy_score": 0.9637068581961482, "eval_f1": 0.6624685138539044, "eval_loss": 0.21445031464099884, "eval_precision": 0.699468085106383, "eval_recall": 0.6291866028708134, "eval_runtime": 6.7298, "eval_samples_per_second": 149.93, "eval_steps_per_second": 18.871, "step": 4600 }, { "epoch": 11.06, "eval_accuracy_score": 0.9644695862200471, "eval_f1": 0.6759142496847416, "eval_loss": 0.20991285145282745, "eval_precision": 0.7146666666666667, "eval_recall": 0.6411483253588517, "eval_runtime": 6.734, "eval_samples_per_second": 149.837, "eval_steps_per_second": 18.86, "step": 4700 }, { "epoch": 11.29, "eval_accuracy_score": 0.96364329752749, "eval_f1": 0.6649778340721977, "eval_loss": 0.22495105862617493, "eval_precision": 0.7065948855989233, "eval_recall": 0.6279904306220095, "eval_runtime": 6.7408, "eval_samples_per_second": 149.687, "eval_steps_per_second": 18.841, "step": 4800 }, { "epoch": 11.53, "eval_accuracy_score": 0.9639611008707811, "eval_f1": 0.6670894102726697, "eval_loss": 0.22267203032970428, "eval_precision": 0.7098515519568152, "eval_recall": 0.6291866028708134, "eval_runtime": 6.7689, "eval_samples_per_second": 149.064, "eval_steps_per_second": 18.762, "step": 4900 }, { "epoch": 11.76, "learning_rate": 3.03921568627451e-06, "loss": 0.0368, "step": 5000 }, { "epoch": 11.76, "eval_accuracy_score": 0.9637068581961482, "eval_f1": 0.6588235294117647, "eval_loss": 0.21161217987537384, "eval_precision": 0.6829268292682927, "eval_recall": 0.6363636363636364, "eval_runtime": 6.7536, "eval_samples_per_second": 149.402, "eval_steps_per_second": 18.805, "step": 5000 }, { "epoch": 12.0, "eval_accuracy_score": 0.9625627661603, "eval_f1": 0.6593830334190232, "eval_loss": 0.227540984749794, "eval_precision": 0.7125, "eval_recall": 0.6136363636363636, "eval_runtime": 6.7584, "eval_samples_per_second": 149.295, "eval_steps_per_second": 18.791, "step": 5100 }, { "epoch": 12.24, "eval_accuracy_score": 0.9628805695035911, "eval_f1": 0.6640471512770137, "eval_loss": 0.23519518971443176, "eval_precision": 0.7337192474674384, "eval_recall": 0.6064593301435407, "eval_runtime": 6.7729, "eval_samples_per_second": 148.976, "eval_steps_per_second": 18.751, "step": 5200 }, { "epoch": 12.47, "eval_accuracy_score": 0.9628170088349329, "eval_f1": 0.6679462571976967, "eval_loss": 0.2271033227443695, "eval_precision": 0.7180192572214581, "eval_recall": 0.6244019138755981, "eval_runtime": 6.7726, "eval_samples_per_second": 148.983, "eval_steps_per_second": 18.752, "step": 5300 }, { "epoch": 12.71, "eval_accuracy_score": 0.9630076908409076, "eval_f1": 0.6628643852978454, "eval_loss": 0.22853700816631317, "eval_precision": 0.7048517520215634, "eval_recall": 0.6255980861244019, "eval_runtime": 6.7535, "eval_samples_per_second": 149.405, "eval_steps_per_second": 18.805, "step": 5400 }, { "epoch": 12.94, "learning_rate": 2.843137254901961e-06, "loss": 0.0321, "step": 5500 }, { "epoch": 12.94, "eval_accuracy_score": 0.9631348121782242, "eval_f1": 0.664548919949174, "eval_loss": 0.22333784401416779, "eval_precision": 0.7086720867208672, "eval_recall": 0.6255980861244019, "eval_runtime": 6.7401, "eval_samples_per_second": 149.702, "eval_steps_per_second": 18.843, "step": 5500 }, { "epoch": 13.18, "eval_accuracy_score": 0.9637068581961482, "eval_f1": 0.6705054382597568, "eval_loss": 0.222885861992836, "eval_precision": 0.7207702888583218, "eval_recall": 0.6267942583732058, "eval_runtime": 6.7486, "eval_samples_per_second": 149.513, "eval_steps_per_second": 18.819, "step": 5600 }, { "epoch": 13.41, "eval_accuracy_score": 0.9633254941841988, "eval_f1": 0.6619718309859155, "eval_loss": 0.2285127490758896, "eval_precision": 0.7121212121212122, "eval_recall": 0.618421052631579, "eval_runtime": 6.8129, "eval_samples_per_second": 148.102, "eval_steps_per_second": 18.641, "step": 5700 }, { "epoch": 13.65, "eval_accuracy_score": 0.9644695862200471, "eval_f1": 0.6734177215189874, "eval_loss": 0.22083869576454163, "eval_precision": 0.7150537634408602, "eval_recall": 0.6363636363636364, "eval_runtime": 6.7283, "eval_samples_per_second": 149.964, "eval_steps_per_second": 18.876, "step": 5800 }, { "epoch": 13.88, "eval_accuracy_score": 0.9635161761901735, "eval_f1": 0.6684005201560469, "eval_loss": 0.2334665209054947, "eval_precision": 0.7321937321937322, "eval_recall": 0.6148325358851675, "eval_runtime": 6.7215, "eval_samples_per_second": 150.116, "eval_steps_per_second": 18.895, "step": 5900 }, { "epoch": 14.12, "learning_rate": 2.647058823529412e-06, "loss": 0.0291, "step": 6000 }, { "epoch": 14.12, "eval_accuracy_score": 0.9641517828767558, "eval_f1": 0.663265306122449, "eval_loss": 0.2206926792860031, "eval_precision": 0.7103825136612022, "eval_recall": 0.6220095693779905, "eval_runtime": 6.7314, "eval_samples_per_second": 149.894, "eval_steps_per_second": 18.867, "step": 6000 }, { "epoch": 14.35, "eval_accuracy_score": 0.9650416322379711, "eval_f1": 0.6737633061991233, "eval_loss": 0.21664156019687653, "eval_precision": 0.7069645203679369, "eval_recall": 0.6435406698564593, "eval_runtime": 6.8128, "eval_samples_per_second": 148.104, "eval_steps_per_second": 18.641, "step": 6100 }, { "epoch": 14.59, "eval_accuracy_score": 0.9646602682260217, "eval_f1": 0.6654275092936804, "eval_loss": 0.20899562537670135, "eval_precision": 0.6902313624678663, "eval_recall": 0.6423444976076556, "eval_runtime": 6.7812, "eval_samples_per_second": 148.794, "eval_steps_per_second": 18.728, "step": 6200 }, { "epoch": 14.82, "eval_accuracy_score": 0.9647873895633382, "eval_f1": 0.6766917293233083, "eval_loss": 0.21245865523815155, "eval_precision": 0.7105263157894737, "eval_recall": 0.645933014354067, "eval_runtime": 6.7236, "eval_samples_per_second": 150.069, "eval_steps_per_second": 18.889, "step": 6300 }, { "epoch": 15.06, "eval_accuracy_score": 0.9637704188648064, "eval_f1": 0.6666666666666667, "eval_loss": 0.22959989309310913, "eval_precision": 0.713506139154161, "eval_recall": 0.6255980861244019, "eval_runtime": 6.7691, "eval_samples_per_second": 149.061, "eval_steps_per_second": 18.762, "step": 6400 }, { "epoch": 15.29, "learning_rate": 2.450980392156863e-06, "loss": 0.0251, "step": 6500 }, { "epoch": 15.29, "eval_accuracy_score": 0.9645331468887053, "eval_f1": 0.6733542319749217, "eval_loss": 0.22114437818527222, "eval_precision": 0.7075098814229249, "eval_recall": 0.6423444976076556, "eval_runtime": 6.8495, "eval_samples_per_second": 147.311, "eval_steps_per_second": 18.542, "step": 6500 }, { "epoch": 15.53, "eval_accuracy_score": 0.9640882222080976, "eval_f1": 0.6713197969543148, "eval_loss": 0.22384566068649292, "eval_precision": 0.7148648648648649, "eval_recall": 0.6327751196172249, "eval_runtime": 6.7143, "eval_samples_per_second": 150.277, "eval_steps_per_second": 18.915, "step": 6600 }, { "epoch": 15.76, "eval_accuracy_score": 0.9637068581961482, "eval_f1": 0.6641172721478649, "eval_loss": 0.23098178207874298, "eval_precision": 0.7107776261937244, "eval_recall": 0.6232057416267942, "eval_runtime": 6.7457, "eval_samples_per_second": 149.576, "eval_steps_per_second": 18.827, "step": 6700 }, { "epoch": 16.0, "eval_accuracy_score": 0.9650416322379711, "eval_f1": 0.6762860727728984, "eval_loss": 0.21991874277591705, "eval_precision": 0.7110817941952506, "eval_recall": 0.6447368421052632, "eval_runtime": 6.7686, "eval_samples_per_second": 149.07, "eval_steps_per_second": 18.763, "step": 6800 }, { "epoch": 16.24, "eval_accuracy_score": 0.96364329752749, "eval_f1": 0.6636771300448431, "eval_loss": 0.23369288444519043, "eval_precision": 0.7144827586206897, "eval_recall": 0.6196172248803827, "eval_runtime": 6.8164, "eval_samples_per_second": 148.025, "eval_steps_per_second": 18.631, "step": 6900 }, { "epoch": 16.47, "learning_rate": 2.254901960784314e-06, "loss": 0.0227, "step": 7000 }, { "epoch": 16.47, "eval_accuracy_score": 0.9646602682260217, "eval_f1": 0.6712243629583592, "eval_loss": 0.22149834036827087, "eval_precision": 0.6985769728331177, "eval_recall": 0.645933014354067, "eval_runtime": 6.7644, "eval_samples_per_second": 149.164, "eval_steps_per_second": 18.775, "step": 7000 }, { "epoch": 16.71, "eval_accuracy_score": 0.9645331468887053, "eval_f1": 0.6687422166874221, "eval_loss": 0.2212422788143158, "eval_precision": 0.6974025974025974, "eval_recall": 0.6423444976076556, "eval_runtime": 6.7009, "eval_samples_per_second": 150.576, "eval_steps_per_second": 18.953, "step": 7100 }, { "epoch": 16.94, "eval_accuracy_score": 0.9635161761901735, "eval_f1": 0.6653821451509313, "eval_loss": 0.24178394675254822, "eval_precision": 0.7184466019417476, "eval_recall": 0.6196172248803827, "eval_runtime": 6.7952, "eval_samples_per_second": 148.486, "eval_steps_per_second": 18.69, "step": 7200 }, { "epoch": 17.18, "eval_accuracy_score": 0.9633890548528571, "eval_f1": 0.6675307841866494, "eval_loss": 0.24713467061519623, "eval_precision": 0.7284299858557284, "eval_recall": 0.6160287081339713, "eval_runtime": 6.807, "eval_samples_per_second": 148.229, "eval_steps_per_second": 18.657, "step": 7300 }, { "epoch": 17.41, "eval_accuracy_score": 0.9643424648827306, "eval_f1": 0.670031545741325, "eval_loss": 0.22886203229427338, "eval_precision": 0.7089452603471295, "eval_recall": 0.6351674641148325, "eval_runtime": 6.7775, "eval_samples_per_second": 148.874, "eval_steps_per_second": 18.738, "step": 7400 }, { "epoch": 17.65, "learning_rate": 2.058823529411765e-06, "loss": 0.0197, "step": 7500 }, { "epoch": 17.65, "eval_accuracy_score": 0.9646602682260217, "eval_f1": 0.6753731343283582, "eval_loss": 0.22524945437908173, "eval_precision": 0.7033678756476683, "eval_recall": 0.6495215311004785, "eval_runtime": 6.7338, "eval_samples_per_second": 149.84, "eval_steps_per_second": 18.86, "step": 7500 }, { "epoch": 17.88, "eval_accuracy_score": 0.9633890548528571, "eval_f1": 0.664528543938422, "eval_loss": 0.24701638519763947, "eval_precision": 0.7164591977869986, "eval_recall": 0.6196172248803827, "eval_runtime": 6.7838, "eval_samples_per_second": 148.736, "eval_steps_per_second": 18.721, "step": 7600 }, { "epoch": 18.12, "eval_accuracy_score": 0.9654865569185788, "eval_f1": 0.6825, "eval_loss": 0.22353364527225494, "eval_precision": 0.7146596858638743, "eval_recall": 0.65311004784689, "eval_runtime": 6.7595, "eval_samples_per_second": 149.272, "eval_steps_per_second": 18.788, "step": 7700 }, { "epoch": 18.35, "eval_accuracy_score": 0.9638975402021229, "eval_f1": 0.6590765338393421, "eval_loss": 0.23786970973014832, "eval_precision": 0.6993288590604027, "eval_recall": 0.6232057416267942, "eval_runtime": 6.8141, "eval_samples_per_second": 148.075, "eval_steps_per_second": 18.638, "step": 7800 }, { "epoch": 18.59, "eval_accuracy_score": 0.9644060255513888, "eval_f1": 0.6666666666666667, "eval_loss": 0.23264023661613464, "eval_precision": 0.7014531043593131, "eval_recall": 0.6351674641148325, "eval_runtime": 6.8013, "eval_samples_per_second": 148.353, "eval_steps_per_second": 18.673, "step": 7900 }, { "epoch": 18.82, "learning_rate": 1.8627450980392158e-06, "loss": 0.0183, "step": 8000 }, { "epoch": 18.82, "eval_accuracy_score": 0.9649780715693129, "eval_f1": 0.6724244293645897, "eval_loss": 0.22304123640060425, "eval_precision": 0.6942675159235668, "eval_recall": 0.6519138755980861, "eval_runtime": 6.7426, "eval_samples_per_second": 149.646, "eval_steps_per_second": 18.835, "step": 8000 }, { "epoch": 19.06, "eval_accuracy_score": 0.9643424648827306, "eval_f1": 0.6683480453972257, "eval_loss": 0.2350449413061142, "eval_precision": 0.7066666666666667, "eval_recall": 0.6339712918660287, "eval_runtime": 6.8057, "eval_samples_per_second": 148.259, "eval_steps_per_second": 18.661, "step": 8100 }, { "epoch": 19.29, "eval_accuracy_score": 0.9652323142439458, "eval_f1": 0.6790582403965303, "eval_loss": 0.226871520280838, "eval_precision": 0.7043701799485861, "eval_recall": 0.6555023923444976, "eval_runtime": 6.7483, "eval_samples_per_second": 149.519, "eval_steps_per_second": 18.819, "step": 8200 }, { "epoch": 19.53, "eval_accuracy_score": 0.96472382889468, "eval_f1": 0.6683354192740926, "eval_loss": 0.23186342418193817, "eval_precision": 0.7007874015748031, "eval_recall": 0.638755980861244, "eval_runtime": 6.7632, "eval_samples_per_second": 149.19, "eval_steps_per_second": 18.778, "step": 8300 }, { "epoch": 19.76, "eval_accuracy_score": 0.9645967075573635, "eval_f1": 0.6712933753943218, "eval_loss": 0.2337142825126648, "eval_precision": 0.7102803738317757, "eval_recall": 0.6363636363636364, "eval_runtime": 6.7451, "eval_samples_per_second": 149.591, "eval_steps_per_second": 18.829, "step": 8400 }, { "epoch": 20.0, "learning_rate": 1.6666666666666667e-06, "loss": 0.0162, "step": 8500 }, { "epoch": 20.0, "eval_accuracy_score": 0.9647873895633382, "eval_f1": 0.6751430387794024, "eval_loss": 0.2389359027147293, "eval_precision": 0.7204884667571235, "eval_recall": 0.6351674641148325, "eval_runtime": 6.7503, "eval_samples_per_second": 149.474, "eval_steps_per_second": 18.814, "step": 8500 }, { "epoch": 20.24, "eval_accuracy_score": 0.9638975402021229, "eval_f1": 0.6709677419354839, "eval_loss": 0.25359493494033813, "eval_precision": 0.7282913165266106, "eval_recall": 0.6220095693779905, "eval_runtime": 6.7422, "eval_samples_per_second": 149.655, "eval_steps_per_second": 18.837, "step": 8600 }, { "epoch": 20.47, "eval_accuracy_score": 0.964215343545414, "eval_f1": 0.6709346991037132, "eval_loss": 0.24693100154399872, "eval_precision": 0.721763085399449, "eval_recall": 0.6267942583732058, "eval_runtime": 6.7296, "eval_samples_per_second": 149.934, "eval_steps_per_second": 18.872, "step": 8700 }, { "epoch": 20.71, "eval_accuracy_score": 0.9637704188648064, "eval_f1": 0.6687938736439056, "eval_loss": 0.2458009421825409, "eval_precision": 0.7168262653898769, "eval_recall": 0.6267942583732058, "eval_runtime": 6.7627, "eval_samples_per_second": 149.201, "eval_steps_per_second": 18.78, "step": 8800 }, { "epoch": 20.94, "eval_accuracy_score": 0.9648509502319964, "eval_f1": 0.676304211187932, "eval_loss": 0.23430827260017395, "eval_precision": 0.7125827814569536, "eval_recall": 0.6435406698564593, "eval_runtime": 6.7289, "eval_samples_per_second": 149.951, "eval_steps_per_second": 18.874, "step": 8900 }, { "epoch": 21.18, "learning_rate": 1.4705882352941177e-06, "loss": 0.0149, "step": 9000 }, { "epoch": 21.18, "eval_accuracy_score": 0.9651687535752876, "eval_f1": 0.6788413098236775, "eval_loss": 0.23078210651874542, "eval_precision": 0.7167553191489362, "eval_recall": 0.6447368421052632, "eval_runtime": 6.7181, "eval_samples_per_second": 150.19, "eval_steps_per_second": 18.904, "step": 9000 } ], "max_steps": 12750, "num_train_epochs": 30, "total_flos": 4695577703714304.0, "trial_name": null, "trial_params": null }