diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,409 +1,3929 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 20.0, + "epoch": 100.0, "eval_steps": 500, - "global_step": 2120, + "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, - "grad_norm": 2.7167601585388184, - "learning_rate": 4.75e-05, - "loss": 0.3551, + "grad_norm": 3.8788857460021973, + "learning_rate": 4.9500000000000004e-05, + "loss": 0.3599, "step": 106 }, { "epoch": 1.0, - "eval_accuracy": 0.9413572343149808, - "eval_f1": 0.764857881136951, - "eval_loss": 0.18727199733257294, - "eval_precision": 0.6788990825688074, - "eval_recall": 0.8757396449704142, - "eval_runtime": 0.7255, - "eval_samples_per_second": 257.747, - "eval_steps_per_second": 4.135, + "eval_LOCATION_f1": 0.8356164383561644, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.512396694214876, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.49206349206349204, + "eval_ORGANIZATION_recall": 0.5344827586206896, + "eval_PERSON_f1": 0.8625, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8214285714285714, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.6666666666666666, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.6363636363636364, + "eval_QUANTITY_recall": 0.7, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.1317242681980133, + "eval_overall_accuracy": 0.9569782330345711, + "eval_overall_f1": 0.7791842475386779, + "eval_overall_precision": 0.7426273458445041, + "eval_overall_recall": 0.8195266272189349, + "eval_runtime": 0.659, + "eval_samples_per_second": 283.783, + "eval_steps_per_second": 4.553, "step": 106 }, { "epoch": 2.0, - "grad_norm": 0.8801630139350891, - "learning_rate": 4.5e-05, - "loss": 0.1199, + "grad_norm": 2.0066733360290527, + "learning_rate": 4.9e-05, + "loss": 0.1201, "step": 212 }, { "epoch": 2.0, - "eval_accuracy": 0.9610755441741358, - "eval_f1": 0.8164383561643835, - "eval_loss": 0.1307690292596817, - "eval_precision": 0.7602040816326531, - "eval_recall": 0.8816568047337278, - "eval_runtime": 0.6806, - "eval_samples_per_second": 274.744, - "eval_steps_per_second": 4.408, + "eval_LOCATION_f1": 0.8053691275167786, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.75, + "eval_LOCATION_recall": 0.8695652173913043, + "eval_ORGANIZATION_f1": 0.7230769230769231, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6527777777777778, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.8860759493670887, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8536585365853658, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.6, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.525, + "eval_QUANTITY_recall": 0.7, + "eval_TIME_f1": 0.75, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.6857142857142857, + "eval_TIME_recall": 0.8275862068965517, + "eval_loss": 0.14421768486499786, + "eval_overall_accuracy": 0.9580025608194622, + "eval_overall_f1": 0.8010973936899862, + "eval_overall_precision": 0.7468030690537084, + "eval_overall_recall": 0.863905325443787, + "eval_runtime": 0.6779, + "eval_samples_per_second": 275.835, + "eval_steps_per_second": 4.425, "step": 212 }, { "epoch": 3.0, - "grad_norm": 6.373292922973633, - "learning_rate": 4.25e-05, - "loss": 0.0746, + "grad_norm": 4.826297760009766, + "learning_rate": 4.85e-05, + "loss": 0.0789, "step": 318 }, { "epoch": 3.0, - "eval_accuracy": 0.9618437900128041, - "eval_f1": 0.8238557558945908, - "eval_loss": 0.13828597962856293, - "eval_precision": 0.7754569190600522, - "eval_recall": 0.878698224852071, - "eval_runtime": 0.6892, - "eval_samples_per_second": 271.342, - "eval_steps_per_second": 4.353, + "eval_LOCATION_f1": 0.8051948051948051, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7294117647058823, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7218045112781956, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.64, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.852760736196319, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.7988505747126436, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8307692307692307, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7714285714285715, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8813559322033899, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8666666666666667, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.15757465362548828, + "eval_overall_accuracy": 0.954673495518566, + "eval_overall_f1": 0.819538670284939, + "eval_overall_precision": 0.7568922305764411, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.7577, + "eval_samples_per_second": 246.801, + "eval_steps_per_second": 3.959, "step": 318 }, { "epoch": 4.0, - "grad_norm": 1.9436761140823364, - "learning_rate": 4e-05, + "grad_norm": 1.5358341932296753, + "learning_rate": 4.8e-05, "loss": 0.0497, "step": 424 }, { "epoch": 4.0, - "eval_accuracy": 0.9554417413572344, - "eval_f1": 0.8183118741058654, - "eval_loss": 0.17165431380271912, - "eval_precision": 0.7922437673130194, - "eval_recall": 0.8461538461538461, - "eval_runtime": 0.7007, - "eval_samples_per_second": 266.88, - "eval_steps_per_second": 4.281, + "eval_LOCATION_f1": 0.8243243243243245, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7721518987341772, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.765625, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7, + "eval_ORGANIZATION_recall": 0.8448275862068966, + "eval_PERSON_f1": 0.8980891719745223, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8703703703703703, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7647058823529411, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.75, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.6857142857142857, + "eval_TIME_recall": 0.8275862068965517, + "eval_loss": 0.15764029324054718, + "eval_overall_accuracy": 0.9628681177976952, + "eval_overall_f1": 0.8384401114206129, + "eval_overall_precision": 0.7921052631578948, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.6908, + "eval_samples_per_second": 270.686, + "eval_steps_per_second": 4.343, "step": 424 }, { "epoch": 5.0, - "grad_norm": 0.7730250954627991, - "learning_rate": 3.7500000000000003e-05, - "loss": 0.0289, + "grad_norm": 0.8067348003387451, + "learning_rate": 4.75e-05, + "loss": 0.0304, "step": 530 }, { "epoch": 5.0, - "eval_accuracy": 0.9620998719590269, - "eval_f1": 0.8389830508474576, - "eval_loss": 0.17060597240924835, - "eval_precision": 0.8027027027027027, - "eval_recall": 0.878698224852071, - "eval_runtime": 0.7043, - "eval_samples_per_second": 265.498, - "eval_steps_per_second": 4.259, + "eval_LOCATION_f1": 0.8591549295774648, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8356164383561644, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.6554621848739496, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.639344262295082, + "eval_ORGANIZATION_recall": 0.6724137931034483, + "eval_PERSON_f1": 0.8681672025723474, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8490566037735849, + "eval_PERSON_recall": 0.8881578947368421, + "eval_QUANTITY_f1": 0.8125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7647058823529411, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8620689655172413, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8620689655172413, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.18078266084194183, + "eval_overall_accuracy": 0.9603072983354674, + "eval_overall_f1": 0.8242074927953891, + "eval_overall_precision": 0.8033707865168539, + "eval_overall_recall": 0.8461538461538461, + "eval_runtime": 0.7144, + "eval_samples_per_second": 261.763, + "eval_steps_per_second": 4.199, "step": 530 }, { "epoch": 6.0, - "grad_norm": 1.2929595708847046, - "learning_rate": 3.5e-05, - "loss": 0.023, + "grad_norm": 2.896883010864258, + "learning_rate": 4.7e-05, + "loss": 0.0258, "step": 636 }, { "epoch": 6.0, - "eval_accuracy": 0.9585147247119078, - "eval_f1": 0.8188105117565698, - "eval_loss": 0.19288022816181183, - "eval_precision": 0.7688311688311689, - "eval_recall": 0.8757396449704142, - "eval_runtime": 0.7437, - "eval_samples_per_second": 251.457, - "eval_steps_per_second": 4.034, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7590361445783133, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6166666666666667, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.5967741935483871, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.8867313915857605, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8726114649681529, + "eval_PERSON_recall": 0.9013157894736842, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.18976914882659912, + "eval_overall_accuracy": 0.9590268886043534, + "eval_overall_f1": 0.8175388967468176, + "eval_overall_precision": 0.7831978319783198, + "eval_overall_recall": 0.8550295857988166, + "eval_runtime": 0.7567, + "eval_samples_per_second": 247.118, + "eval_steps_per_second": 3.964, "step": 636 }, { "epoch": 7.0, - "grad_norm": 0.03867774084210396, - "learning_rate": 3.2500000000000004e-05, - "loss": 0.0161, + "grad_norm": 0.08857329934835434, + "learning_rate": 4.6500000000000005e-05, + "loss": 0.0151, "step": 742 }, { "epoch": 7.0, - "eval_accuracy": 0.9539052496798975, - "eval_f1": 0.82336578581363, - "eval_loss": 0.24569807946681976, - "eval_precision": 0.7769028871391076, - "eval_recall": 0.8757396449704142, - "eval_runtime": 0.7594, - "eval_samples_per_second": 246.235, - "eval_steps_per_second": 3.95, + "eval_LOCATION_f1": 0.84, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7777777777777778, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6491228070175439, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6607142857142857, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.8789808917197451, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8518518518518519, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.84375, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7941176470588235, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.7692307692307692, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.6944444444444444, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.22696857154369354, + "eval_overall_accuracy": 0.9587708066581306, + "eval_overall_f1": 0.8203677510608204, + "eval_overall_precision": 0.7859078590785907, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.7647, + "eval_samples_per_second": 244.536, + "eval_steps_per_second": 3.923, "step": 742 }, { "epoch": 8.0, - "grad_norm": 0.1270778626203537, - "learning_rate": 3e-05, - "loss": 0.0106, + "grad_norm": 0.24211041629314423, + "learning_rate": 4.600000000000001e-05, + "loss": 0.0124, "step": 848 }, { "epoch": 8.0, - "eval_accuracy": 0.9572343149807938, - "eval_f1": 0.8347338935574229, - "eval_loss": 0.24495673179626465, - "eval_precision": 0.7925531914893617, - "eval_recall": 0.8816568047337278, - "eval_runtime": 0.7817, - "eval_samples_per_second": 239.211, - "eval_steps_per_second": 3.838, + "eval_LOCATION_f1": 0.8493150684931507, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.706766917293233, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6266666666666667, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.8761904761904762, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8466257668711656, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.2596437335014343, + "eval_overall_accuracy": 0.9569782330345711, + "eval_overall_f1": 0.83008356545961, + "eval_overall_precision": 0.7842105263157895, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.7892, + "eval_samples_per_second": 236.961, + "eval_steps_per_second": 3.802, "step": 848 }, { "epoch": 9.0, - "grad_norm": 1.8804335594177246, - "learning_rate": 2.7500000000000004e-05, - "loss": 0.0065, + "grad_norm": 0.5304147005081177, + "learning_rate": 4.55e-05, + "loss": 0.0088, "step": 954 }, { "epoch": 9.0, - "eval_accuracy": 0.9628681177976952, - "eval_f1": 0.8551336146272854, - "eval_loss": 0.23150116205215454, - "eval_precision": 0.8150134048257373, - "eval_recall": 0.8994082840236687, - "eval_runtime": 0.8068, - "eval_samples_per_second": 231.794, - "eval_steps_per_second": 3.719, + "eval_LOCATION_f1": 0.8571428571428572, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8076923076923077, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7401574803149606, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6811594202898551, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.8535825545171339, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8106508875739645, + "eval_PERSON_recall": 0.9013157894736842, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8333333333333334, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8064516129032258, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.26296016573905945, + "eval_overall_accuracy": 0.9562099871959027, + "eval_overall_f1": 0.83008356545961, + "eval_overall_precision": 0.7842105263157895, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8059, + "eval_samples_per_second": 232.037, + "eval_steps_per_second": 3.723, "step": 954 }, { "epoch": 10.0, - "grad_norm": 2.087066888809204, - "learning_rate": 2.5e-05, - "loss": 0.0053, + "grad_norm": 1.2787593603134155, + "learning_rate": 4.5e-05, + "loss": 0.0083, "step": 1060 }, { "epoch": 10.0, - "eval_accuracy": 0.9626120358514725, - "eval_f1": 0.84822695035461, - "eval_loss": 0.2372884303331375, - "eval_precision": 0.8147138964577657, - "eval_recall": 0.8846153846153846, - "eval_runtime": 0.7914, - "eval_samples_per_second": 236.29, - "eval_steps_per_second": 3.791, + "eval_LOCATION_f1": 0.8513513513513514, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7974683544303798, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7703703703703704, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6753246753246753, + "eval_ORGANIZATION_recall": 0.896551724137931, + "eval_PERSON_f1": 0.9079365079365079, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8773006134969326, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.7500000000000001, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7058823529411765, + "eval_QUANTITY_recall": 0.8, + "eval_TIME_f1": 0.8135593220338982, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8, + "eval_TIME_recall": 0.8275862068965517, + "eval_loss": 0.23285891115665436, + "eval_overall_accuracy": 0.963124199743918, + "eval_overall_f1": 0.8488210818307906, + "eval_overall_precision": 0.7989556135770235, + "eval_overall_recall": 0.9053254437869822, + "eval_runtime": 0.8566, + "eval_samples_per_second": 218.314, + "eval_steps_per_second": 3.502, "step": 1060 }, { "epoch": 11.0, - "grad_norm": 0.011662549339234829, - "learning_rate": 2.25e-05, - "loss": 0.004, + "grad_norm": 2.0766656398773193, + "learning_rate": 4.4500000000000004e-05, + "loss": 0.0088, "step": 1166 }, { "epoch": 11.0, - "eval_accuracy": 0.9638924455825865, - "eval_f1": 0.855507868383405, - "eval_loss": 0.2421087622642517, - "eval_precision": 0.8282548476454293, - "eval_recall": 0.8846153846153846, - "eval_runtime": 0.8007, - "eval_samples_per_second": 233.559, - "eval_steps_per_second": 3.747, + "eval_LOCATION_f1": 0.8571428571428572, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8076923076923077, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7154471544715447, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.676923076923077, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.875, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8333333333333334, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.78125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7352941176470589, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.23979602754116058, + "eval_overall_accuracy": 0.9610755441741358, + "eval_overall_f1": 0.8324022346368716, + "eval_overall_precision": 0.7883597883597884, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.7972, + "eval_samples_per_second": 234.561, + "eval_steps_per_second": 3.763, "step": 1166 }, { "epoch": 12.0, - "grad_norm": 0.012989125214517117, - "learning_rate": 2e-05, - "loss": 0.003, + "grad_norm": 0.004628497175872326, + "learning_rate": 4.4000000000000006e-05, + "loss": 0.007, "step": 1272 }, { "epoch": 12.0, - "eval_accuracy": 0.9620998719590269, - "eval_f1": 0.8499298737727911, - "eval_loss": 0.25717440247535706, - "eval_precision": 0.808, - "eval_recall": 0.8964497041420119, - "eval_runtime": 0.7997, - "eval_samples_per_second": 233.831, - "eval_steps_per_second": 3.751, + "eval_LOCATION_f1": 0.8243243243243245, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7721518987341772, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7704918032786885, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.734375, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.8758169934640522, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.881578947368421, + "eval_QUANTITY_f1": 0.7936507936507938, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7575757575757576, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8813559322033899, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8666666666666667, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.23579084873199463, + "eval_overall_accuracy": 0.9623559539052496, + "eval_overall_f1": 0.8395415472779371, + "eval_overall_precision": 0.8138888888888889, + "eval_overall_recall": 0.8668639053254438, + "eval_runtime": 0.8766, + "eval_samples_per_second": 213.313, + "eval_steps_per_second": 3.422, "step": 1272 }, { "epoch": 13.0, - "grad_norm": 0.0042635309509932995, - "learning_rate": 1.75e-05, - "loss": 0.0027, + "grad_norm": 0.023974481970071793, + "learning_rate": 4.35e-05, + "loss": 0.0061, "step": 1378 }, { "epoch": 13.0, - "eval_accuracy": 0.9615877080665813, - "eval_f1": 0.8502824858757062, - "eval_loss": 0.2515665292739868, - "eval_precision": 0.8135135135135135, - "eval_recall": 0.8905325443786982, - "eval_runtime": 0.8271, - "eval_samples_per_second": 226.082, - "eval_steps_per_second": 3.627, + "eval_LOCATION_f1": 0.851063829787234, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8333333333333334, + "eval_LOCATION_recall": 0.8695652173913043, + "eval_ORGANIZATION_f1": 0.6019417475728155, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6888888888888889, + "eval_ORGANIZATION_recall": 0.5344827586206896, + "eval_PERSON_f1": 0.8932038834951456, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8789808917197452, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7428571428571429, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8813559322033899, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8666666666666667, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.24468651413917542, + "eval_overall_accuracy": 0.9613316261203585, + "eval_overall_f1": 0.8301329394387003, + "eval_overall_precision": 0.8289085545722714, + "eval_overall_recall": 0.8313609467455622, + "eval_runtime": 0.8154, + "eval_samples_per_second": 229.344, + "eval_steps_per_second": 3.679, "step": 1378 }, { "epoch": 14.0, - "grad_norm": 0.009077166207134724, - "learning_rate": 1.5e-05, - "loss": 0.0012, + "grad_norm": 0.16095533967018127, + "learning_rate": 4.3e-05, + "loss": 0.0073, "step": 1484 }, { "epoch": 14.0, - "eval_accuracy": 0.9649167733674776, - "eval_f1": 0.8523206751054854, - "eval_loss": 0.26363739371299744, - "eval_precision": 0.8123324396782842, - "eval_recall": 0.8964497041420119, - "eval_runtime": 0.8031, - "eval_samples_per_second": 232.86, - "eval_steps_per_second": 3.736, + "eval_LOCATION_f1": 0.8551724137931034, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8157894736842105, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7500000000000001, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7258064516129032, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.8996763754045308, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8853503184713376, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8307692307692307, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7714285714285715, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.23856018483638763, + "eval_overall_accuracy": 0.9641485275288092, + "eval_overall_f1": 0.855507868383405, + "eval_overall_precision": 0.8282548476454293, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.7969, + "eval_samples_per_second": 234.66, + "eval_steps_per_second": 3.765, "step": 1484 }, { "epoch": 15.0, - "grad_norm": 0.011607971042394638, - "learning_rate": 1.25e-05, - "loss": 0.002, + "grad_norm": 3.3597922325134277, + "learning_rate": 4.25e-05, + "loss": 0.0046, "step": 1590 }, { "epoch": 15.0, - "eval_accuracy": 0.9626120358514725, - "eval_f1": 0.847887323943662, - "eval_loss": 0.26717498898506165, - "eval_precision": 0.8091397849462365, - "eval_recall": 0.8905325443786982, - "eval_runtime": 0.8047, - "eval_samples_per_second": 232.386, - "eval_steps_per_second": 3.728, + "eval_LOCATION_f1": 0.8493150684931507, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.75, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6857142857142857, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.9055374592833876, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.896774193548387, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8571428571428572, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8181818181818182, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.23872800171375275, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8579545454545454, + "eval_overall_precision": 0.825136612021858, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8079, + "eval_samples_per_second": 231.459, + "eval_steps_per_second": 3.713, "step": 1590 }, { "epoch": 16.0, - "grad_norm": 12.164788246154785, - "learning_rate": 1e-05, - "loss": 0.0012, + "grad_norm": 4.114704608917236, + "learning_rate": 4.2e-05, + "loss": 0.003, "step": 1696 }, { "epoch": 16.0, - "eval_accuracy": 0.9633802816901409, - "eval_f1": 0.8486562942008485, - "eval_loss": 0.26104938983917236, - "eval_precision": 0.8130081300813008, - "eval_recall": 0.8875739644970414, - "eval_runtime": 0.8077, - "eval_samples_per_second": 231.527, - "eval_steps_per_second": 3.714, + "eval_LOCATION_f1": 0.8493150684931507, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.6363636363636364, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6730769230769231, + "eval_ORGANIZATION_recall": 0.603448275862069, + "eval_PERSON_f1": 0.9042904290429044, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9072847682119205, + "eval_PERSON_recall": 0.9013157894736842, + "eval_QUANTITY_f1": 0.8571428571428572, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8181818181818182, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.847457627118644, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8333333333333334, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.2643202841281891, + "eval_overall_accuracy": 0.9610755441741358, + "eval_overall_f1": 0.8399412628487519, + "eval_overall_precision": 0.8338192419825073, + "eval_overall_recall": 0.8461538461538461, + "eval_runtime": 0.7994, + "eval_samples_per_second": 233.932, + "eval_steps_per_second": 3.753, "step": 1696 }, { "epoch": 17.0, - "grad_norm": 0.011607704684138298, - "learning_rate": 7.5e-06, - "loss": 0.001, + "grad_norm": 0.06794843822717667, + "learning_rate": 4.15e-05, + "loss": 0.0027, "step": 1802 }, { "epoch": 17.0, - "eval_accuracy": 0.963124199743918, - "eval_f1": 0.8579545454545454, - "eval_loss": 0.2693929374217987, - "eval_precision": 0.825136612021858, - "eval_recall": 0.893491124260355, - "eval_runtime": 0.8045, - "eval_samples_per_second": 232.444, - "eval_steps_per_second": 3.729, + "eval_LOCATION_f1": 0.8724832214765101, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8125, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7538461538461538, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6805555555555556, + "eval_ORGANIZATION_recall": 0.8448275862068966, + "eval_PERSON_f1": 0.8701298701298701, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8589743589743589, + "eval_PERSON_recall": 0.881578947368421, + "eval_QUANTITY_f1": 0.84375, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7941176470588235, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.279176265001297, + "eval_overall_accuracy": 0.9613316261203585, + "eval_overall_f1": 0.8466947960618846, + "eval_overall_precision": 0.806970509383378, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8067, + "eval_samples_per_second": 231.813, + "eval_steps_per_second": 3.719, "step": 1802 }, { "epoch": 18.0, - "grad_norm": 0.006694562267512083, - "learning_rate": 5e-06, - "loss": 0.0012, + "grad_norm": 0.005153521429747343, + "learning_rate": 4.1e-05, + "loss": 0.0037, "step": 1908 }, { "epoch": 18.0, - "eval_accuracy": 0.9626120358514725, - "eval_f1": 0.8579465541490858, - "eval_loss": 0.2814978361129761, - "eval_precision": 0.8176943699731903, - "eval_recall": 0.9023668639053254, - "eval_runtime": 0.8078, - "eval_samples_per_second": 231.481, - "eval_steps_per_second": 3.714, + "eval_LOCATION_f1": 0.8366013071895425, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7619047619047619, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7154471544715447, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.676923076923077, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.8945686900958467, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8695652173913043, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8571428571428572, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8181818181818182, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.27270039916038513, + "eval_overall_accuracy": 0.9620998719590269, + "eval_overall_f1": 0.8443197755960729, + "eval_overall_precision": 0.8026666666666666, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8021, + "eval_samples_per_second": 233.132, + "eval_steps_per_second": 3.74, "step": 1908 }, { "epoch": 19.0, - "grad_norm": 0.025878561660647392, - "learning_rate": 2.5e-06, - "loss": 0.0012, + "grad_norm": 0.6481520533561707, + "learning_rate": 4.05e-05, + "loss": 0.0046, "step": 2014 }, { "epoch": 19.0, - "eval_accuracy": 0.9628681177976952, - "eval_f1": 0.8567375886524823, - "eval_loss": 0.2722916901111603, - "eval_precision": 0.8228882833787466, - "eval_recall": 0.893491124260355, - "eval_runtime": 0.8081, - "eval_samples_per_second": 231.404, - "eval_steps_per_second": 3.712, + "eval_LOCATION_f1": 0.8378378378378378, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7258064516129032, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6818181818181818, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9155844155844156, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9038461538461539, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8571428571428572, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8181818181818182, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8620689655172413, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8620689655172413, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.24588538706302643, + "eval_overall_accuracy": 0.9636363636363636, + "eval_overall_f1": 0.855920114122682, + "eval_overall_precision": 0.8264462809917356, + "eval_overall_recall": 0.8875739644970414, + "eval_runtime": 0.8194, + "eval_samples_per_second": 228.23, + "eval_steps_per_second": 3.661, "step": 2014 }, { "epoch": 20.0, - "grad_norm": 0.002320911968126893, - "learning_rate": 0.0, - "loss": 0.0008, + "grad_norm": 0.020622072741389275, + "learning_rate": 4e-05, + "loss": 0.0048, "step": 2120 }, { "epoch": 20.0, - "eval_accuracy": 0.963124199743918, - "eval_f1": 0.8583569405099151, - "eval_loss": 0.2749256491661072, - "eval_precision": 0.8233695652173914, - "eval_recall": 0.8964497041420119, - "eval_runtime": 0.8093, - "eval_samples_per_second": 231.054, - "eval_steps_per_second": 3.707, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7590361445783133, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7317073170731708, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6923076923076923, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8571428571428572, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8181818181818182, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8125, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7428571428571429, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2616201937198639, + "eval_overall_accuracy": 0.9613316261203585, + "eval_overall_f1": 0.8443197755960729, + "eval_overall_precision": 0.8026666666666666, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8054, + "eval_samples_per_second": 232.17, + "eval_steps_per_second": 3.725, "step": 2120 }, { - "epoch": 20.0, - "step": 2120, - "total_flos": 896507603456604.0, - "train_loss": 0.03541206091572091, - "train_runtime": 493.9256, - "train_samples_per_second": 68.31, - "train_steps_per_second": 4.292 + "epoch": 21.0, + "grad_norm": 3.6123130321502686, + "learning_rate": 3.9500000000000005e-05, + "loss": 0.0047, + "step": 2226 + }, + { + "epoch": 21.0, + "eval_LOCATION_f1": 0.8666666666666666, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8024691358024691, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.736, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6865671641791045, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.8932038834951456, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8789808917197452, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8307692307692308, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.75, + "eval_TIME_recall": 0.9310344827586207, + "eval_loss": 0.24132052063941956, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.848314606741573, + "eval_overall_precision": 0.8074866310160428, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8121, + "eval_samples_per_second": 230.255, + "eval_steps_per_second": 3.694, + "step": 2226 + }, + { + "epoch": 22.0, + "grad_norm": 0.009204844012856483, + "learning_rate": 3.9000000000000006e-05, + "loss": 0.0041, + "step": 2332 + }, + { + "epoch": 22.0, + "eval_LOCATION_f1": 0.8476821192052981, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7804878048780488, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7384615384615385, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6666666666666666, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.9032258064516129, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8860759493670886, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.78125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7352941176470589, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8125, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7428571428571429, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2953908145427704, + "eval_overall_accuracy": 0.9620998719590269, + "eval_overall_f1": 0.8428372739916552, + "eval_overall_precision": 0.7952755905511811, + "eval_overall_recall": 0.8964497041420119, + "eval_runtime": 0.8088, + "eval_samples_per_second": 231.216, + "eval_steps_per_second": 3.709, + "step": 2332 + }, + { + "epoch": 23.0, + "grad_norm": 0.007008604239672422, + "learning_rate": 3.85e-05, + "loss": 0.0034, + "step": 2438 + }, + { + "epoch": 23.0, + "eval_LOCATION_f1": 0.8435374149659864, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.765625, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7, + "eval_ORGANIZATION_recall": 0.8448275862068966, + "eval_PERSON_f1": 0.9131832797427653, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8930817610062893, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.819672131147541, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8064516129032258, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8125, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7428571428571429, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.26445022225379944, + "eval_overall_accuracy": 0.9661971830985916, + "eval_overall_f1": 0.8551336146272854, + "eval_overall_precision": 0.8150134048257373, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.797, + "eval_samples_per_second": 234.637, + "eval_steps_per_second": 3.764, + "step": 2438 + }, + { + "epoch": 24.0, + "grad_norm": 0.31136611104011536, + "learning_rate": 3.8e-05, + "loss": 0.0021, + "step": 2544 + }, + { + "epoch": 24.0, + "eval_LOCATION_f1": 0.8493150684931507, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7874015748031497, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7246376811594203, + "eval_ORGANIZATION_recall": 0.8620689655172413, + "eval_PERSON_f1": 0.9067524115755626, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8867924528301887, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8135593220338982, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8275862068965517, + "eval_QUANTITY_recall": 0.8, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.27145740389823914, + "eval_overall_accuracy": 0.9654289372599232, + "eval_overall_f1": 0.8595744680851063, + "eval_overall_precision": 0.8256130790190735, + "eval_overall_recall": 0.8964497041420119, + "eval_runtime": 0.8132, + "eval_samples_per_second": 229.963, + "eval_steps_per_second": 3.689, + "step": 2544 + }, + { + "epoch": 25.0, + "grad_norm": 0.07211441546678543, + "learning_rate": 3.7500000000000003e-05, + "loss": 0.0022, + "step": 2650 + }, + { + "epoch": 25.0, + "eval_LOCATION_f1": 0.8551724137931034, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8157894736842105, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7500000000000001, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7258064516129032, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9084967320261438, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9025974025974026, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.26712566614151, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8546762589928059, + "eval_overall_precision": 0.8319327731092437, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8059, + "eval_samples_per_second": 232.043, + "eval_steps_per_second": 3.723, + "step": 2650 + }, + { + "epoch": 26.0, + "grad_norm": 6.344851970672607, + "learning_rate": 3.7e-05, + "loss": 0.0021, + "step": 2756 + }, + { + "epoch": 26.0, + "eval_LOCATION_f1": 0.8311688311688311, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7529411764705882, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7419354838709677, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.696969696969697, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8333333333333334, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8333333333333334, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.30937761068344116, + "eval_overall_accuracy": 0.9623559539052496, + "eval_overall_f1": 0.8486562942008485, + "eval_overall_precision": 0.8130081300813008, + "eval_overall_recall": 0.8875739644970414, + "eval_runtime": 0.8324, + "eval_samples_per_second": 224.639, + "eval_steps_per_second": 3.604, + "step": 2756 + }, + { + "epoch": 27.0, + "grad_norm": 0.9656301736831665, + "learning_rate": 3.65e-05, + "loss": 0.0033, + "step": 2862 + }, + { + "epoch": 27.0, + "eval_LOCATION_f1": 0.8299319727891156, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.782051282051282, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7603305785123967, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7301587301587301, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9137380191693291, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8881987577639752, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2710714638233185, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8555240793201133, + "eval_overall_precision": 0.8206521739130435, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.802, + "eval_samples_per_second": 233.165, + "eval_steps_per_second": 3.741, + "step": 2862 + }, + { + "epoch": 28.0, + "grad_norm": 0.023881729692220688, + "learning_rate": 3.6e-05, + "loss": 0.003, + "step": 2968 + }, + { + "epoch": 28.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7804878048780489, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7384615384615385, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.9161290322580645, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8987341772151899, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.78125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7352941176470589, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2883354723453522, + "eval_overall_accuracy": 0.964404609475032, + "eval_overall_f1": 0.8563380281690142, + "eval_overall_precision": 0.8172043010752689, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.8155, + "eval_samples_per_second": 229.295, + "eval_steps_per_second": 3.679, + "step": 2968 + }, + { + "epoch": 29.0, + "grad_norm": 0.004700132180005312, + "learning_rate": 3.55e-05, + "loss": 0.0021, + "step": 3074 + }, + { + "epoch": 29.0, + "eval_LOCATION_f1": 0.8571428571428572, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8076923076923077, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7317073170731708, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6923076923076923, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.8996763754045308, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8853503184713376, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2531093657016754, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8530670470756063, + "eval_overall_precision": 0.8236914600550964, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.8176, + "eval_samples_per_second": 228.73, + "eval_steps_per_second": 3.669, + "step": 3074 + }, + { + "epoch": 30.0, + "grad_norm": 0.1790827363729477, + "learning_rate": 3.5e-05, + "loss": 0.0016, + "step": 3180 + }, + { + "epoch": 30.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7590361445783133, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6434782608695653, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6491228070175439, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.910828025477707, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8827160493827161, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.29236629605293274, + "eval_overall_accuracy": 0.9626120358514725, + "eval_overall_f1": 0.8356940509915014, + "eval_overall_precision": 0.8016304347826086, + "eval_overall_recall": 0.8727810650887574, + "eval_runtime": 0.8083, + "eval_samples_per_second": 231.339, + "eval_steps_per_second": 3.711, + "step": 3180 + }, + { + "epoch": 31.0, + "grad_norm": 0.0017360023921355605, + "learning_rate": 3.45e-05, + "loss": 0.0048, + "step": 3286 + }, + { + "epoch": 31.0, + "eval_LOCATION_f1": 0.8724832214765101, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8125, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6885245901639345, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.65625, + "eval_ORGANIZATION_recall": 0.7241379310344828, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2867705523967743, + "eval_overall_accuracy": 0.9626120358514725, + "eval_overall_f1": 0.8446327683615819, + "eval_overall_precision": 0.8081081081081081, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.8033, + "eval_samples_per_second": 232.803, + "eval_steps_per_second": 3.735, + "step": 3286 + }, + { + "epoch": 32.0, + "grad_norm": 0.009486394003033638, + "learning_rate": 3.4000000000000007e-05, + "loss": 0.0032, + "step": 3392 + }, + { + "epoch": 32.0, + "eval_LOCATION_f1": 0.8243243243243245, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7721518987341772, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7142857142857142, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6617647058823529, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.8974358974358975, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.875, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.7878787878787877, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7222222222222222, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8125, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7428571428571429, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2836323380470276, + "eval_overall_accuracy": 0.9605633802816902, + "eval_overall_f1": 0.8324022346368716, + "eval_overall_precision": 0.7883597883597884, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8087, + "eval_samples_per_second": 231.245, + "eval_steps_per_second": 3.71, + "step": 3392 + }, + { + "epoch": 33.0, + "grad_norm": 0.008940489031374454, + "learning_rate": 3.35e-05, + "loss": 0.004, + "step": 3498 + }, + { + "epoch": 33.0, + "eval_LOCATION_f1": 0.8611111111111112, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8266666666666667, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.735042735042735, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7288135593220338, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.896774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.879746835443038, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.25650379061698914, + "eval_overall_accuracy": 0.9656850192061459, + "eval_overall_f1": 0.8493543758967002, + "eval_overall_precision": 0.8245125348189415, + "eval_overall_recall": 0.8757396449704142, + "eval_runtime": 0.8037, + "eval_samples_per_second": 232.687, + "eval_steps_per_second": 3.733, + "step": 3498 + }, + { + "epoch": 34.0, + "grad_norm": 0.018895745277404785, + "learning_rate": 3.3e-05, + "loss": 0.0016, + "step": 3604 + }, + { + "epoch": 34.0, + "eval_LOCATION_f1": 0.8366013071895425, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7619047619047619, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.6896551724137931, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6896551724137931, + "eval_ORGANIZATION_recall": 0.6896551724137931, + "eval_PERSON_f1": 0.9015873015873016, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8711656441717791, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2746643126010895, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8429985855728428, + "eval_overall_precision": 0.8075880758807588, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8043, + "eval_samples_per_second": 232.493, + "eval_steps_per_second": 3.73, + "step": 3604 + }, + { + "epoch": 35.0, + "grad_norm": 0.0035857518669217825, + "learning_rate": 3.2500000000000004e-05, + "loss": 0.0018, + "step": 3710 + }, + { + "epoch": 35.0, + "eval_LOCATION_f1": 0.8590604026845639, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7479674796747967, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7076923076923077, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9096774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8924050632911392, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.870967741935484, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.84375, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.26389142870903015, + "eval_overall_accuracy": 0.9659411011523688, + "eval_overall_f1": 0.8611898016997167, + "eval_overall_precision": 0.8260869565217391, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.822, + "eval_samples_per_second": 227.49, + "eval_steps_per_second": 3.65, + "step": 3710 + }, + { + "epoch": 36.0, + "grad_norm": 0.0013648144667968154, + "learning_rate": 3.2000000000000005e-05, + "loss": 0.0032, + "step": 3816 + }, + { + "epoch": 36.0, + "eval_LOCATION_f1": 0.8904109589041096, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8441558441558441, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.717948717948718, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.711864406779661, + "eval_ORGANIZATION_recall": 0.7241379310344828, + "eval_PERSON_f1": 0.919093851132686, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9044585987261147, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8253968253968255, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7647058823529411, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2595536410808563, + "eval_overall_accuracy": 0.9654289372599232, + "eval_overall_f1": 0.860832137733142, + "eval_overall_precision": 0.8356545961002786, + "eval_overall_recall": 0.8875739644970414, + "eval_runtime": 0.8156, + "eval_samples_per_second": 229.278, + "eval_steps_per_second": 3.678, + "step": 3816 + }, + { + "epoch": 37.0, + "grad_norm": 0.001226762542501092, + "learning_rate": 3.15e-05, + "loss": 0.0024, + "step": 3922 + }, + { + "epoch": 37.0, + "eval_LOCATION_f1": 0.882758620689655, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8421052631578947, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.728813559322034, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7166666666666667, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9102564102564101, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8875, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7647058823529411, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.847457627118644, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8333333333333334, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.2782364785671234, + "eval_overall_accuracy": 0.9669654289372599, + "eval_overall_f1": 0.8595988538681948, + "eval_overall_precision": 0.8333333333333334, + "eval_overall_recall": 0.8875739644970414, + "eval_runtime": 0.8106, + "eval_samples_per_second": 230.693, + "eval_steps_per_second": 3.701, + "step": 3922 + }, + { + "epoch": 38.0, + "grad_norm": 0.0014669048832729459, + "learning_rate": 3.1e-05, + "loss": 0.002, + "step": 4028 + }, + { + "epoch": 38.0, + "eval_LOCATION_f1": 0.8590604026845639, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7704918032786885, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.734375, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.9084967320261438, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9025974025974026, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.2879778742790222, + "eval_overall_accuracy": 0.9664532650448143, + "eval_overall_f1": 0.8571428571428571, + "eval_overall_precision": 0.8287292817679558, + "eval_overall_recall": 0.8875739644970414, + "eval_runtime": 0.8881, + "eval_samples_per_second": 210.566, + "eval_steps_per_second": 3.378, + "step": 4028 + }, + { + "epoch": 39.0, + "grad_norm": 0.008377453312277794, + "learning_rate": 3.05e-05, + "loss": 0.0027, + "step": 4134 + }, + { + "epoch": 39.0, + "eval_LOCATION_f1": 0.8724832214765101, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8125, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.71875, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6571428571428571, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.8924050632911392, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8597560975609756, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8000000000000002, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8, + "eval_QUANTITY_recall": 0.8, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2859266996383667, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.84593837535014, + "eval_overall_precision": 0.8031914893617021, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8126, + "eval_samples_per_second": 230.123, + "eval_steps_per_second": 3.692, + "step": 4134 + }, + { + "epoch": 40.0, + "grad_norm": 6.265191078186035, + "learning_rate": 3e-05, + "loss": 0.0028, + "step": 4240 + }, + { + "epoch": 40.0, + "eval_LOCATION_f1": 0.8648648648648648, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.810126582278481, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7704918032786885, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.734375, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.9166666666666667, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.89375, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.27767661213874817, + "eval_overall_accuracy": 0.9674775928297055, + "eval_overall_f1": 0.8640226628895185, + "eval_overall_precision": 0.8288043478260869, + "eval_overall_recall": 0.9023668639053254, + "eval_runtime": 0.8112, + "eval_samples_per_second": 230.533, + "eval_steps_per_second": 3.698, + "step": 4240 + }, + { + "epoch": 41.0, + "grad_norm": 0.01230549905449152, + "learning_rate": 2.95e-05, + "loss": 0.0013, + "step": 4346 + }, + { + "epoch": 41.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7540983606557378, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.71875, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.910828025477707, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8827160493827161, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8709677419354839, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8181818181818182, + "eval_TIME_recall": 0.9310344827586207, + "eval_loss": 0.27420660853385925, + "eval_overall_accuracy": 0.9667093469910372, + "eval_overall_f1": 0.8579465541490858, + "eval_overall_precision": 0.8176943699731903, + "eval_overall_recall": 0.9023668639053254, + "eval_runtime": 0.804, + "eval_samples_per_second": 232.579, + "eval_steps_per_second": 3.731, + "step": 4346 + }, + { + "epoch": 42.0, + "grad_norm": 0.0334417000412941, + "learning_rate": 2.9e-05, + "loss": 0.0035, + "step": 4452 + }, + { + "epoch": 42.0, + "eval_LOCATION_f1": 0.8904109589041096, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8441558441558441, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7603305785123967, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7301587301587301, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9050632911392406, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8719512195121951, + "eval_PERSON_recall": 0.9407894736842105, + "eval_QUANTITY_f1": 0.7936507936507938, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7575757575757576, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8571428571428571, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7941176470588235, + "eval_TIME_recall": 0.9310344827586207, + "eval_loss": 0.28786924481391907, + "eval_overall_accuracy": 0.9674775928297055, + "eval_overall_f1": 0.8631875881523273, + "eval_overall_precision": 0.8247978436657682, + "eval_overall_recall": 0.9053254437869822, + "eval_runtime": 0.9089, + "eval_samples_per_second": 205.735, + "eval_steps_per_second": 3.301, + "step": 4452 + }, + { + "epoch": 43.0, + "grad_norm": 0.27700409293174744, + "learning_rate": 2.8499999999999998e-05, + "loss": 0.0014, + "step": 4558 + }, + { + "epoch": 43.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7580645161290323, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7121212121212122, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.877742946708464, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8383233532934131, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.7741935483870969, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.75, + "eval_QUANTITY_recall": 0.8, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2879803478717804, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8443197755960729, + "eval_overall_precision": 0.8026666666666666, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8107, + "eval_samples_per_second": 230.668, + "eval_steps_per_second": 3.701, + "step": 4558 + }, + { + "epoch": 44.0, + "grad_norm": 0.5553054213523865, + "learning_rate": 2.8000000000000003e-05, + "loss": 0.002, + "step": 4664 + }, + { + "epoch": 44.0, + "eval_LOCATION_f1": 0.8648648648648648, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.810126582278481, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.796875, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7285714285714285, + "eval_ORGANIZATION_recall": 0.8793103448275862, + "eval_PERSON_f1": 0.9161290322580645, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8987341772151899, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2945367693901062, + "eval_overall_accuracy": 0.9661971830985916, + "eval_overall_f1": 0.867605633802817, + "eval_overall_precision": 0.8279569892473119, + "eval_overall_recall": 0.9112426035502958, + "eval_runtime": 0.8052, + "eval_samples_per_second": 232.233, + "eval_steps_per_second": 3.726, + "step": 4664 + }, + { + "epoch": 45.0, + "grad_norm": 0.12713950872421265, + "learning_rate": 2.7500000000000004e-05, + "loss": 0.003, + "step": 4770 + }, + { + "epoch": 45.0, + "eval_LOCATION_f1": 0.8311688311688311, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7529411764705882, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7226890756302522, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7049180327868853, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9155844155844156, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9038461538461539, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.819672131147541, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8064516129032258, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8813559322033899, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8666666666666667, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2897718548774719, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8530670470756063, + "eval_overall_precision": 0.8236914600550964, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.8046, + "eval_samples_per_second": 232.414, + "eval_steps_per_second": 3.729, + "step": 4770 + }, + { + "epoch": 46.0, + "grad_norm": 0.0031549884006381035, + "learning_rate": 2.7000000000000002e-05, + "loss": 0.0029, + "step": 4876 + }, + { + "epoch": 46.0, + "eval_LOCATION_f1": 0.8441558441558441, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7647058823529411, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.8125, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7428571428571429, + "eval_ORGANIZATION_recall": 0.896551724137931, + "eval_PERSON_f1": 0.9067524115755626, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8867924528301887, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.870967741935484, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.84375, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8125, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7428571428571429, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.310619056224823, + "eval_overall_accuracy": 0.9654289372599232, + "eval_overall_f1": 0.8650904033379694, + "eval_overall_precision": 0.8162729658792651, + "eval_overall_recall": 0.9201183431952663, + "eval_runtime": 0.8131, + "eval_samples_per_second": 229.995, + "eval_steps_per_second": 3.69, + "step": 4876 + }, + { + "epoch": 47.0, + "grad_norm": 0.037439510226249695, + "learning_rate": 2.6500000000000004e-05, + "loss": 0.0033, + "step": 4982 + }, + { + "epoch": 47.0, + "eval_LOCATION_f1": 0.8840579710144928, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8840579710144928, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.6788990825688075, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7254901960784313, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.9215686274509804, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9155844155844156, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8524590163934426, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8387096774193549, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8620689655172413, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8620689655172413, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.26650553941726685, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8630952380952381, + "eval_overall_precision": 0.8682634730538922, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.8111, + "eval_samples_per_second": 230.541, + "eval_steps_per_second": 3.699, + "step": 4982 + }, + { + "epoch": 48.0, + "grad_norm": 0.005395154468715191, + "learning_rate": 2.6000000000000002e-05, + "loss": 0.0027, + "step": 5088 + }, + { + "epoch": 48.0, + "eval_LOCATION_f1": 0.8311688311688311, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7529411764705882, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7538461538461538, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6805555555555556, + "eval_ORGANIZATION_recall": 0.8448275862068966, + "eval_PERSON_f1": 0.896774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.879746835443038, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3204702138900757, + "eval_overall_accuracy": 0.9605633802816902, + "eval_overall_f1": 0.8467966573816157, + "eval_overall_precision": 0.8, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.8068, + "eval_samples_per_second": 231.778, + "eval_steps_per_second": 3.718, + "step": 5088 + }, + { + "epoch": 49.0, + "grad_norm": 0.010527399368584156, + "learning_rate": 2.5500000000000003e-05, + "loss": 0.0014, + "step": 5194 + }, + { + "epoch": 49.0, + "eval_LOCATION_f1": 0.8724832214765101, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8125, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7419354838709677, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.696969696969697, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9131832797427653, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8930817610062893, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.28002333641052246, + "eval_overall_accuracy": 0.9656850192061459, + "eval_overall_f1": 0.8640226628895185, + "eval_overall_precision": 0.8288043478260869, + "eval_overall_recall": 0.9023668639053254, + "eval_runtime": 0.8074, + "eval_samples_per_second": 231.603, + "eval_steps_per_second": 3.716, + "step": 5194 + }, + { + "epoch": 50.0, + "grad_norm": 0.0005556904943659902, + "learning_rate": 2.5e-05, + "loss": 0.0005, + "step": 5300 + }, + { + "epoch": 50.0, + "eval_LOCATION_f1": 0.8590604026845639, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7441860465116279, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.676056338028169, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.9067524115755626, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8867924528301887, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.30621612071990967, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8579465541490858, + "eval_overall_precision": 0.8176943699731903, + "eval_overall_recall": 0.9023668639053254, + "eval_runtime": 0.8061, + "eval_samples_per_second": 231.983, + "eval_steps_per_second": 3.722, + "step": 5300 + }, + { + "epoch": 51.0, + "grad_norm": 0.002213704166933894, + "learning_rate": 2.45e-05, + "loss": 0.0009, + "step": 5406 + }, + { + "epoch": 51.0, + "eval_LOCATION_f1": 0.8356164383561644, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7200000000000001, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6716417910447762, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.8974358974358975, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.875, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3094327747821808, + "eval_overall_accuracy": 0.9615877080665813, + "eval_overall_f1": 0.8429985855728428, + "eval_overall_precision": 0.8075880758807588, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8118, + "eval_samples_per_second": 230.354, + "eval_steps_per_second": 3.696, + "step": 5406 + }, + { + "epoch": 52.0, + "grad_norm": 0.12124722450971603, + "learning_rate": 2.4e-05, + "loss": 0.0007, + "step": 5512 + }, + { + "epoch": 52.0, + "eval_LOCATION_f1": 0.8493150684931507, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.7226890756302522, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7049180327868853, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.870967741935484, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.84375, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2926962077617645, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8538681948424068, + "eval_overall_precision": 0.8277777777777777, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8047, + "eval_samples_per_second": 232.378, + "eval_steps_per_second": 3.728, + "step": 5512 + }, + { + "epoch": 53.0, + "grad_norm": 0.007010570261627436, + "learning_rate": 2.35e-05, + "loss": 0.0005, + "step": 5618 + }, + { + "epoch": 53.0, + "eval_LOCATION_f1": 0.8413793103448277, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8026315789473685, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9038461538461539, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.88125, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3106415271759033, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8497854077253219, + "eval_overall_precision": 0.8227146814404432, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8081, + "eval_samples_per_second": 231.4, + "eval_steps_per_second": 3.712, + "step": 5618 + }, + { + "epoch": 54.0, + "grad_norm": 0.0005368912825360894, + "learning_rate": 2.3000000000000003e-05, + "loss": 0.0006, + "step": 5724 + }, + { + "epoch": 54.0, + "eval_LOCATION_f1": 0.8472222222222223, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8133333333333334, + "eval_LOCATION_recall": 0.8840579710144928, + "eval_ORGANIZATION_f1": 0.7241379310344829, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7241379310344828, + "eval_ORGANIZATION_recall": 0.7241379310344828, + "eval_PERSON_f1": 0.9102564102564101, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8875, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3165185749530792, + "eval_overall_accuracy": 0.9649167733674776, + "eval_overall_f1": 0.8546762589928059, + "eval_overall_precision": 0.8319327731092437, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8064, + "eval_samples_per_second": 231.905, + "eval_steps_per_second": 3.72, + "step": 5724 + }, + { + "epoch": 55.0, + "grad_norm": 0.0005507151363417506, + "learning_rate": 2.25e-05, + "loss": 0.0008, + "step": 5830 + }, + { + "epoch": 55.0, + "eval_LOCATION_f1": 0.8920863309352518, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8857142857142857, + "eval_LOCATION_recall": 0.8985507246376812, + "eval_ORGANIZATION_f1": 0.6915887850467289, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7551020408163265, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.9061488673139159, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.89171974522293, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8813559322033899, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8666666666666667, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.28772225975990295, + "eval_overall_accuracy": 0.9677336747759283, + "eval_overall_f1": 0.8579881656804734, + "eval_overall_precision": 0.8579881656804734, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.8028, + "eval_samples_per_second": 232.926, + "eval_steps_per_second": 3.737, + "step": 5830 + }, + { + "epoch": 56.0, + "grad_norm": 0.004189824219793081, + "learning_rate": 2.2000000000000003e-05, + "loss": 0.0013, + "step": 5936 + }, + { + "epoch": 56.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6956521739130435, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7017543859649122, + "eval_ORGANIZATION_recall": 0.6896551724137931, + "eval_PERSON_f1": 0.9126213592233009, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8980891719745223, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8524590163934426, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8387096774193549, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.2933734357357025, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.861271676300578, + "eval_overall_precision": 0.8418079096045198, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8184, + "eval_samples_per_second": 228.501, + "eval_steps_per_second": 3.666, + "step": 5936 + }, + { + "epoch": 57.0, + "grad_norm": 0.00032704288605600595, + "learning_rate": 2.15e-05, + "loss": 0.0003, + "step": 6042 + }, + { + "epoch": 57.0, + "eval_LOCATION_f1": 0.8904109589041096, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8441558441558441, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6956521739130435, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7017543859649122, + "eval_ORGANIZATION_recall": 0.6896551724137931, + "eval_PERSON_f1": 0.9096774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8924050632911392, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.31640374660491943, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8563218390804598, + "eval_overall_precision": 0.8324022346368715, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8095, + "eval_samples_per_second": 231.007, + "eval_steps_per_second": 3.706, + "step": 6042 + }, + { + "epoch": 58.0, + "grad_norm": 0.0005215631099417806, + "learning_rate": 2.1e-05, + "loss": 0.0004, + "step": 6148 + }, + { + "epoch": 58.0, + "eval_LOCATION_f1": 0.8843537414965987, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8333333333333334, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7107438016528926, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6825396825396826, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9096774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8924050632911392, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.32982975244522095, + "eval_overall_accuracy": 0.9628681177976952, + "eval_overall_f1": 0.8575498575498575, + "eval_overall_precision": 0.8269230769230769, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8776, + "eval_samples_per_second": 213.09, + "eval_steps_per_second": 3.419, + "step": 6148 + }, + { + "epoch": 59.0, + "grad_norm": 0.13604550063610077, + "learning_rate": 2.05e-05, + "loss": 0.0006, + "step": 6254 + }, + { + "epoch": 59.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6371681415929203, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6545454545454545, + "eval_ORGANIZATION_recall": 0.6206896551724138, + "eval_PERSON_f1": 0.9131832797427653, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8930817610062893, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3474750220775604, + "eval_overall_accuracy": 0.9618437900128041, + "eval_overall_f1": 0.8513708513708513, + "eval_overall_precision": 0.8309859154929577, + "eval_overall_recall": 0.8727810650887574, + "eval_runtime": 0.812, + "eval_samples_per_second": 230.289, + "eval_steps_per_second": 3.694, + "step": 6254 + }, + { + "epoch": 60.0, + "grad_norm": 0.0007290157955139875, + "learning_rate": 2e-05, + "loss": 0.0009, + "step": 6360 + }, + { + "epoch": 60.0, + "eval_LOCATION_f1": 0.8783783783783783, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8227848101265823, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7731092436974789, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7540983606557377, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9096774193548387, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8924050632911392, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3445851802825928, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8673323823109843, + "eval_overall_precision": 0.837465564738292, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.8135, + "eval_samples_per_second": 229.871, + "eval_steps_per_second": 3.688, + "step": 6360 + }, + { + "epoch": 61.0, + "grad_norm": 0.01683318056166172, + "learning_rate": 1.9500000000000003e-05, + "loss": 0.0005, + "step": 6466 + }, + { + "epoch": 61.0, + "eval_LOCATION_f1": 0.8666666666666666, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8024691358024691, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7200000000000001, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6716417910447762, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3661682605743408, + "eval_overall_accuracy": 0.9610755441741358, + "eval_overall_f1": 0.8519040902679831, + "eval_overall_precision": 0.8140161725067385, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8073, + "eval_samples_per_second": 231.639, + "eval_steps_per_second": 3.716, + "step": 6466 + }, + { + "epoch": 62.0, + "grad_norm": 0.0029261417221277952, + "learning_rate": 1.9e-05, + "loss": 0.002, + "step": 6572 + }, + { + "epoch": 62.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7377049180327868, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.703125, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9067524115755626, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8867924528301887, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.7936507936507938, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7575757575757576, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.31876397132873535, + "eval_overall_accuracy": 0.9664532650448143, + "eval_overall_f1": 0.861626248216833, + "eval_overall_precision": 0.8319559228650137, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8044, + "eval_samples_per_second": 232.462, + "eval_steps_per_second": 3.729, + "step": 6572 + }, + { + "epoch": 63.0, + "grad_norm": 0.0014877787325531244, + "learning_rate": 1.85e-05, + "loss": 0.0005, + "step": 6678 + }, + { + "epoch": 63.0, + "eval_LOCATION_f1": 0.8951048951048951, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8648648648648649, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7603305785123967, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7301587301587301, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.819672131147541, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8064516129032258, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3222368061542511, + "eval_overall_accuracy": 0.9669654289372599, + "eval_overall_f1": 0.864942528735632, + "eval_overall_precision": 0.840782122905028, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8114, + "eval_samples_per_second": 230.457, + "eval_steps_per_second": 3.697, + "step": 6678 + }, + { + "epoch": 64.0, + "grad_norm": 0.000210550642805174, + "learning_rate": 1.8e-05, + "loss": 0.0003, + "step": 6784 + }, + { + "epoch": 64.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7642276422764227, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7230769230769231, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.32881781458854675, + "eval_overall_accuracy": 0.9661971830985916, + "eval_overall_f1": 0.8603988603988605, + "eval_overall_precision": 0.8296703296703297, + "eval_overall_recall": 0.893491124260355, + "eval_runtime": 0.8114, + "eval_samples_per_second": 230.476, + "eval_steps_per_second": 3.697, + "step": 6784 + }, + { + "epoch": 65.0, + "grad_norm": 0.0021329650189727545, + "learning_rate": 1.75e-05, + "loss": 0.0003, + "step": 6890 + }, + { + "epoch": 65.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7704918032786885, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.734375, + "eval_ORGANIZATION_recall": 0.8103448275862069, + "eval_PERSON_f1": 0.8987341772151899, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8658536585365854, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.33311548829078674, + "eval_overall_accuracy": 0.9661971830985916, + "eval_overall_f1": 0.8628005657708628, + "eval_overall_precision": 0.8265582655826558, + "eval_overall_recall": 0.9023668639053254, + "eval_runtime": 0.8037, + "eval_samples_per_second": 232.685, + "eval_steps_per_second": 3.733, + "step": 6890 + }, + { + "epoch": 66.0, + "grad_norm": 0.0006951324758119881, + "learning_rate": 1.7000000000000003e-05, + "loss": 0.0003, + "step": 6996 + }, + { + "epoch": 66.0, + "eval_LOCATION_f1": 0.881118881118881, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8513513513513513, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6666666666666667, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6981132075471698, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.9090909090909091, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8974358974358975, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8666666666666666, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8387096774193549, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.31618252396583557, + "eval_overall_accuracy": 0.9661971830985916, + "eval_overall_f1": 0.8525547445255474, + "eval_overall_precision": 0.8414985590778098, + "eval_overall_recall": 0.863905325443787, + "eval_runtime": 0.8125, + "eval_samples_per_second": 230.14, + "eval_steps_per_second": 3.692, + "step": 6996 + }, + { + "epoch": 67.0, + "grad_norm": 0.0028227961156517267, + "learning_rate": 1.65e-05, + "loss": 0.0024, + "step": 7102 + }, + { + "epoch": 67.0, + "eval_LOCATION_f1": 0.863013698630137, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8181818181818182, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7438016528925621, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7142857142857143, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9114754098360655, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9084967320261438, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3060024380683899, + "eval_overall_accuracy": 0.9672215108834827, + "eval_overall_f1": 0.8575539568345324, + "eval_overall_precision": 0.834733893557423, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8036, + "eval_samples_per_second": 232.709, + "eval_steps_per_second": 3.733, + "step": 7102 + }, + { + "epoch": 68.0, + "grad_norm": 0.0007019271142780781, + "learning_rate": 1.6000000000000003e-05, + "loss": 0.002, + "step": 7208 + }, + { + "epoch": 68.0, + "eval_LOCATION_f1": 0.8904109589041096, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8441558441558441, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6851851851851852, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.74, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.9155844155844156, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.9038461538461539, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8387096774193549, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7878787878787878, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.3085281252861023, + "eval_overall_accuracy": 0.9651728553137003, + "eval_overall_f1": 0.8600583090379009, + "eval_overall_precision": 0.8477011494252874, + "eval_overall_recall": 0.8727810650887574, + "eval_runtime": 0.8099, + "eval_samples_per_second": 230.884, + "eval_steps_per_second": 3.704, + "step": 7208 + }, + { + "epoch": 69.0, + "grad_norm": 13.608760833740234, + "learning_rate": 1.55e-05, + "loss": 0.0014, + "step": 7314 + }, + { + "epoch": 69.0, + "eval_LOCATION_f1": 0.8904109589041096, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8441558441558441, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7086614173228347, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6521739130434783, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.89171974522293, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8641975308641975, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.888888888888889, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8484848484848485, + "eval_QUANTITY_recall": 0.9333333333333333, + "eval_TIME_f1": 0.8524590163934426, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.8125, + "eval_TIME_recall": 0.896551724137931, + "eval_loss": 0.30335918068885803, + "eval_overall_accuracy": 0.9649167733674776, + "eval_overall_f1": 0.8551336146272854, + "eval_overall_precision": 0.8150134048257373, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.8074, + "eval_samples_per_second": 231.614, + "eval_steps_per_second": 3.716, + "step": 7314 + }, + { + "epoch": 70.0, + "grad_norm": 0.00710656400769949, + "learning_rate": 1.5e-05, + "loss": 0.0006, + "step": 7420 + }, + { + "epoch": 70.0, + "eval_LOCATION_f1": 0.882758620689655, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8421052631578947, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7244094488188977, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6666666666666666, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.888888888888889, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8588957055214724, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8064516129032258, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7575757575757576, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3125246465206146, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8466947960618846, + "eval_overall_precision": 0.806970509383378, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8058, + "eval_samples_per_second": 232.071, + "eval_steps_per_second": 3.723, + "step": 7420 + }, + { + "epoch": 71.0, + "grad_norm": 0.00047848603571765125, + "learning_rate": 1.45e-05, + "loss": 0.0009, + "step": 7526 + }, + { + "epoch": 71.0, + "eval_LOCATION_f1": 0.8749999999999999, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.84, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7301587301587301, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6764705882352942, + "eval_ORGANIZATION_recall": 0.7931034482758621, + "eval_PERSON_f1": 0.8952380952380953, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8650306748466258, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7647058823529411, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.7666666666666667, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.7419354838709677, + "eval_TIME_recall": 0.7931034482758621, + "eval_loss": 0.3196626901626587, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.843441466854725, + "eval_overall_precision": 0.8059299191374663, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.8027, + "eval_samples_per_second": 232.972, + "eval_steps_per_second": 3.738, + "step": 7526 + }, + { + "epoch": 72.0, + "grad_norm": 0.002629638649523258, + "learning_rate": 1.4000000000000001e-05, + "loss": 0.0009, + "step": 7632 + }, + { + "epoch": 72.0, + "eval_LOCATION_f1": 0.882758620689655, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8421052631578947, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7317073170731708, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6923076923076923, + "eval_ORGANIZATION_recall": 0.7758620689655172, + "eval_PERSON_f1": 0.9073482428115016, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8819875776397516, + "eval_PERSON_recall": 0.9342105263157895, + "eval_QUANTITY_f1": 0.8125, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7647058823529411, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.7868852459016394, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.75, + "eval_TIME_recall": 0.8275862068965517, + "eval_loss": 0.3206939697265625, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8526912181303117, + "eval_overall_precision": 0.8179347826086957, + "eval_overall_recall": 0.8905325443786982, + "eval_runtime": 0.8794, + "eval_samples_per_second": 212.64, + "eval_steps_per_second": 3.411, + "step": 7632 + }, + { + "epoch": 73.0, + "grad_norm": 0.0006528229569084942, + "learning_rate": 1.3500000000000001e-05, + "loss": 0.0006, + "step": 7738 + }, + { + "epoch": 73.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7049180327868853, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.671875, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9061488673139159, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.89171974522293, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.32062897086143494, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8502139800285307, + "eval_overall_precision": 0.8209366391184573, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8113, + "eval_samples_per_second": 230.503, + "eval_steps_per_second": 3.698, + "step": 7738 + }, + { + "epoch": 74.0, + "grad_norm": 0.0003340624098200351, + "learning_rate": 1.3000000000000001e-05, + "loss": 0.0004, + "step": 7844 + }, + { + "epoch": 74.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7213114754098361, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6875, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.8990228013029316, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8903225806451613, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.32088541984558105, + "eval_overall_accuracy": 0.9641485275288092, + "eval_overall_f1": 0.8497854077253219, + "eval_overall_precision": 0.8227146814404432, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8194, + "eval_samples_per_second": 228.212, + "eval_steps_per_second": 3.661, + "step": 7844 + }, + { + "epoch": 75.0, + "grad_norm": 0.0001975786144612357, + "learning_rate": 1.25e-05, + "loss": 0.0003, + "step": 7950 + }, + { + "epoch": 75.0, + "eval_LOCATION_f1": 0.8936170212765957, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.875, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6991869918699186, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6615384615384615, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.8996763754045308, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8853503184713376, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.32191890478134155, + "eval_overall_accuracy": 0.9636363636363636, + "eval_overall_f1": 0.8493543758967002, + "eval_overall_precision": 0.8245125348189415, + "eval_overall_recall": 0.8757396449704142, + "eval_runtime": 0.7893, + "eval_samples_per_second": 236.92, + "eval_steps_per_second": 3.801, + "step": 7950 + }, + { + "epoch": 76.0, + "grad_norm": 0.0004086096887476742, + "learning_rate": 1.2e-05, + "loss": 0.0003, + "step": 8056 + }, + { + "epoch": 76.0, + "eval_LOCATION_f1": 0.8767123287671235, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8311688311688312, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.732824427480916, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6575342465753424, + "eval_ORGANIZATION_recall": 0.8275862068965517, + "eval_PERSON_f1": 0.9038461538461539, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.88125, + "eval_PERSON_recall": 0.9276315789473685, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3355537950992584, + "eval_overall_accuracy": 0.963124199743918, + "eval_overall_f1": 0.85273492286115, + "eval_overall_precision": 0.8106666666666666, + "eval_overall_recall": 0.8994082840236687, + "eval_runtime": 0.8123, + "eval_samples_per_second": 230.209, + "eval_steps_per_second": 3.693, + "step": 8056 + }, + { + "epoch": 77.0, + "grad_norm": 0.000383577193133533, + "learning_rate": 1.1500000000000002e-05, + "loss": 0.0002, + "step": 8162 + }, + { + "epoch": 77.0, + "eval_LOCATION_f1": 0.8951048951048951, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8648648648648649, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3264581859111786, + "eval_overall_accuracy": 0.9656850192061459, + "eval_overall_f1": 0.8550932568149211, + "eval_overall_precision": 0.83008356545961, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8006, + "eval_samples_per_second": 233.575, + "eval_steps_per_second": 3.747, + "step": 8162 + }, + { + "epoch": 78.0, + "grad_norm": 0.0004785690689459443, + "learning_rate": 1.1000000000000001e-05, + "loss": 0.0002, + "step": 8268 + }, + { + "epoch": 78.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7213114754098361, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6875, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.9003215434083601, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8805031446540881, + "eval_PERSON_recall": 0.9210526315789473, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.32919907569885254, + "eval_overall_accuracy": 0.9649167733674776, + "eval_overall_f1": 0.8530670470756063, + "eval_overall_precision": 0.8236914600550964, + "eval_overall_recall": 0.8846153846153846, + "eval_runtime": 0.7937, + "eval_samples_per_second": 235.609, + "eval_steps_per_second": 3.78, + "step": 8268 + }, + { + "epoch": 79.0, + "grad_norm": 0.8365729451179504, + "learning_rate": 1.05e-05, + "loss": 0.0003, + "step": 8374 + }, + { + "epoch": 79.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7154471544715447, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.676923076923077, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.891025641025641, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.86875, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.333362877368927, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8490028490028488, + "eval_overall_precision": 0.8186813186813187, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8323, + "eval_samples_per_second": 224.68, + "eval_steps_per_second": 3.604, + "step": 8374 + }, + { + "epoch": 80.0, + "grad_norm": 0.0004933515447191894, + "learning_rate": 1e-05, + "loss": 0.0006, + "step": 8480 + }, + { + "epoch": 80.0, + "eval_LOCATION_f1": 0.8951048951048951, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8648648648648649, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.6890756302521007, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6721311475409836, + "eval_ORGANIZATION_recall": 0.7068965517241379, + "eval_PERSON_f1": 0.9055374592833876, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.896774193548387, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.870967741935484, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.84375, + "eval_QUANTITY_recall": 0.9, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.33931657671928406, + "eval_overall_accuracy": 0.9646606914212548, + "eval_overall_f1": 0.8554913294797689, + "eval_overall_precision": 0.8361581920903954, + "eval_overall_recall": 0.8757396449704142, + "eval_runtime": 0.8001, + "eval_samples_per_second": 233.722, + "eval_steps_per_second": 3.75, + "step": 8480 + }, + { + "epoch": 81.0, + "grad_norm": 0.0009226278634741902, + "learning_rate": 9.5e-06, + "loss": 0.0002, + "step": 8586 + }, + { + "epoch": 81.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7213114754098361, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6875, + "eval_ORGANIZATION_recall": 0.7586206896551724, + "eval_PERSON_f1": 0.8990228013029316, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8903225806451613, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8253968253968254, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.7878787878787878, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3536657691001892, + "eval_overall_accuracy": 0.964404609475032, + "eval_overall_f1": 0.8522238163558107, + "eval_overall_precision": 0.8272980501392758, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8023, + "eval_samples_per_second": 233.087, + "eval_steps_per_second": 3.739, + "step": 8586 + }, + { + "epoch": 82.0, + "grad_norm": 0.001014114823192358, + "learning_rate": 9e-06, + "loss": 0.0003, + "step": 8692 + }, + { + "epoch": 82.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.719298245614035, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7321428571428571, + "eval_ORGANIZATION_recall": 0.7068965517241379, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3606484830379486, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8505079825834543, + "eval_overall_precision": 0.8347578347578347, + "eval_overall_recall": 0.8668639053254438, + "eval_runtime": 0.8129, + "eval_samples_per_second": 230.048, + "eval_steps_per_second": 3.691, + "step": 8692 + }, + { + "epoch": 83.0, + "grad_norm": 0.0005941664567217231, + "learning_rate": 8.500000000000002e-06, + "loss": 0.0006, + "step": 8798 + }, + { + "epoch": 83.0, + "eval_LOCATION_f1": 0.9090909090909092, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8783783783783784, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6545454545454545, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6923076923076923, + "eval_ORGANIZATION_recall": 0.6206896551724138, + "eval_PERSON_f1": 0.9055374592833876, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.896774193548387, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35767465829849243, + "eval_overall_accuracy": 0.9641485275288092, + "eval_overall_f1": 0.8491947291361641, + "eval_overall_precision": 0.8405797101449275, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.8106, + "eval_samples_per_second": 230.7, + "eval_steps_per_second": 3.701, + "step": 8798 + }, + { + "epoch": 84.0, + "grad_norm": 0.0007156149367801845, + "learning_rate": 8.000000000000001e-06, + "loss": 0.001, + "step": 8904 + }, + { + "epoch": 84.0, + "eval_LOCATION_f1": 0.9027777777777778, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8666666666666667, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6548672566371682, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6727272727272727, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8064516129032259, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.78125, + "eval_QUANTITY_recall": 0.8333333333333334, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.36741259694099426, + "eval_overall_accuracy": 0.9618437900128041, + "eval_overall_f1": 0.8430232558139535, + "eval_overall_precision": 0.8285714285714286, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.799, + "eval_samples_per_second": 234.039, + "eval_steps_per_second": 3.755, + "step": 8904 + }, + { + "epoch": 85.0, + "grad_norm": 0.00027448913897387683, + "learning_rate": 7.5e-06, + "loss": 0.0006, + "step": 9010 + }, + { + "epoch": 85.0, + "eval_LOCATION_f1": 0.9090909090909092, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8783783783783784, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.6725663716814159, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6909090909090909, + "eval_ORGANIZATION_recall": 0.6551724137931034, + "eval_PERSON_f1": 0.8932038834951456, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8789808917197452, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.36387643218040466, + "eval_overall_accuracy": 0.9615877080665813, + "eval_overall_f1": 0.8488372093023255, + "eval_overall_precision": 0.8342857142857143, + "eval_overall_recall": 0.863905325443787, + "eval_runtime": 0.8034, + "eval_samples_per_second": 232.767, + "eval_steps_per_second": 3.734, + "step": 9010 + }, + { + "epoch": 86.0, + "grad_norm": 0.0002620484447106719, + "learning_rate": 7.000000000000001e-06, + "loss": 0.0004, + "step": 9116 + }, + { + "epoch": 86.0, + "eval_LOCATION_f1": 0.8936170212765957, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.875, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6851851851851852, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.74, + "eval_ORGANIZATION_recall": 0.6379310344827587, + "eval_PERSON_f1": 0.8996763754045308, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8853503184713376, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3683052957057953, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8516886930983848, + "eval_overall_precision": 0.8454810495626822, + "eval_overall_recall": 0.8579881656804734, + "eval_runtime": 0.796, + "eval_samples_per_second": 234.923, + "eval_steps_per_second": 3.769, + "step": 9116 + }, + { + "epoch": 87.0, + "grad_norm": 0.00031526130624115467, + "learning_rate": 6.5000000000000004e-06, + "loss": 0.0005, + "step": 9222 + }, + { + "epoch": 87.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.6846846846846846, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7169811320754716, + "eval_ORGANIZATION_recall": 0.6551724137931034, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35311439633369446, + "eval_overall_accuracy": 0.9626120358514725, + "eval_overall_f1": 0.8483965014577258, + "eval_overall_precision": 0.8362068965517241, + "eval_overall_recall": 0.8609467455621301, + "eval_runtime": 0.7988, + "eval_samples_per_second": 234.112, + "eval_steps_per_second": 3.756, + "step": 9222 + }, + { + "epoch": 88.0, + "grad_norm": 0.0015132308471947908, + "learning_rate": 6e-06, + "loss": 0.0002, + "step": 9328 + }, + { + "epoch": 88.0, + "eval_LOCATION_f1": 0.881118881118881, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8513513513513513, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.6909090909090909, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7307692307692307, + "eval_ORGANIZATION_recall": 0.6551724137931034, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3533298671245575, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8508771929824561, + "eval_overall_precision": 0.8410404624277457, + "eval_overall_recall": 0.8609467455621301, + "eval_runtime": 0.8072, + "eval_samples_per_second": 231.657, + "eval_steps_per_second": 3.716, + "step": 9328 + }, + { + "epoch": 89.0, + "grad_norm": 0.00042143117752857506, + "learning_rate": 5.500000000000001e-06, + "loss": 0.0002, + "step": 9434 + }, + { + "epoch": 89.0, + "eval_LOCATION_f1": 0.881118881118881, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8513513513513513, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.719298245614035, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7321428571428571, + "eval_ORGANIZATION_recall": 0.7068965517241379, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35247281193733215, + "eval_overall_accuracy": 0.9636363636363636, + "eval_overall_f1": 0.8517441860465117, + "eval_overall_precision": 0.8371428571428572, + "eval_overall_recall": 0.8668639053254438, + "eval_runtime": 0.8068, + "eval_samples_per_second": 231.777, + "eval_steps_per_second": 3.718, + "step": 9434 + }, + { + "epoch": 90.0, + "grad_norm": 0.0002251994446851313, + "learning_rate": 5e-06, + "loss": 0.0002, + "step": 9540 + }, + { + "epoch": 90.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7241379310344829, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7241379310344828, + "eval_ORGANIZATION_recall": 0.7241379310344828, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35829171538352966, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8567293777134587, + "eval_overall_precision": 0.8385269121813032, + "eval_overall_recall": 0.8757396449704142, + "eval_runtime": 0.813, + "eval_samples_per_second": 230.023, + "eval_steps_per_second": 3.69, + "step": 9540 + }, + { + "epoch": 91.0, + "grad_norm": 0.0003033955581486225, + "learning_rate": 4.5e-06, + "loss": 0.0002, + "step": 9646 + }, + { + "epoch": 91.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.735042735042735, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7288135593220338, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3626328408718109, + "eval_overall_accuracy": 0.963124199743918, + "eval_overall_f1": 0.8571428571428573, + "eval_overall_precision": 0.8366197183098592, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.791, + "eval_samples_per_second": 236.421, + "eval_steps_per_second": 3.793, + "step": 9646 + }, + { + "epoch": 92.0, + "grad_norm": 0.00020177336409687996, + "learning_rate": 4.000000000000001e-06, + "loss": 0.0005, + "step": 9752 + }, + { + "epoch": 92.0, + "eval_LOCATION_f1": 0.881118881118881, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8513513513513513, + "eval_LOCATION_recall": 0.9130434782608695, + "eval_ORGANIZATION_f1": 0.7304347826086957, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7368421052631579, + "eval_ORGANIZATION_recall": 0.7241379310344828, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3607942759990692, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8534107402031931, + "eval_overall_precision": 0.8376068376068376, + "eval_overall_recall": 0.8698224852071006, + "eval_runtime": 0.8031, + "eval_samples_per_second": 232.851, + "eval_steps_per_second": 3.736, + "step": 9752 + }, + { + "epoch": 93.0, + "grad_norm": 0.0001372557453578338, + "learning_rate": 3.5000000000000004e-06, + "loss": 0.0002, + "step": 9858 + }, + { + "epoch": 93.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.728813559322034, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7166666666666667, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3570501208305359, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8571428571428573, + "eval_overall_precision": 0.8366197183098592, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8126, + "eval_samples_per_second": 230.138, + "eval_steps_per_second": 3.692, + "step": 9858 + }, + { + "epoch": 94.0, + "grad_norm": 0.00034642827813513577, + "learning_rate": 3e-06, + "loss": 0.0002, + "step": 9964 + }, + { + "epoch": 94.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.728813559322034, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.7166666666666667, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3574298322200775, + "eval_overall_accuracy": 0.9633802816901409, + "eval_overall_f1": 0.8571428571428573, + "eval_overall_precision": 0.8366197183098592, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8062, + "eval_samples_per_second": 231.955, + "eval_steps_per_second": 3.721, + "step": 9964 + }, + { + "epoch": 95.0, + "grad_norm": 0.0005071151535958052, + "learning_rate": 2.5e-06, + "loss": 0.0004, + "step": 10070 + }, + { + "epoch": 95.0, + "eval_LOCATION_f1": 0.8951048951048951, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8648648648648649, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35781243443489075, + "eval_overall_accuracy": 0.9641485275288092, + "eval_overall_f1": 0.8559077809798271, + "eval_overall_precision": 0.8342696629213483, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8038, + "eval_samples_per_second": 232.657, + "eval_steps_per_second": 3.732, + "step": 10070 + }, + { + "epoch": 96.0, + "grad_norm": 0.000192229199456051, + "learning_rate": 2.0000000000000003e-06, + "loss": 0.0003, + "step": 10176 + }, + { + "epoch": 96.0, + "eval_LOCATION_f1": 0.8951048951048951, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8648648648648649, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.8961038961038961, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8846153846153846, + "eval_PERSON_recall": 0.9078947368421053, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35879892110824585, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8530259365994237, + "eval_overall_precision": 0.8314606741573034, + "eval_overall_recall": 0.8757396449704142, + "eval_runtime": 0.8034, + "eval_samples_per_second": 232.77, + "eval_steps_per_second": 3.734, + "step": 10176 + }, + { + "epoch": 97.0, + "grad_norm": 0.00012044800678268075, + "learning_rate": 1.5e-06, + "loss": 0.0004, + "step": 10282 + }, + { + "epoch": 97.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3565698266029358, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8546762589928059, + "eval_overall_precision": 0.8319327731092437, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.8012, + "eval_samples_per_second": 233.392, + "eval_steps_per_second": 3.744, + "step": 10282 + }, + { + "epoch": 98.0, + "grad_norm": 0.0002169125946238637, + "learning_rate": 1.0000000000000002e-06, + "loss": 0.0003, + "step": 10388 + }, + { + "epoch": 98.0, + "eval_LOCATION_f1": 0.888888888888889, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8533333333333334, + "eval_LOCATION_recall": 0.927536231884058, + "eval_ORGANIZATION_f1": 0.7107438016528926, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6825396825396826, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3576311767101288, + "eval_overall_accuracy": 0.9636363636363636, + "eval_overall_f1": 0.8534482758620691, + "eval_overall_precision": 0.8296089385474861, + "eval_overall_recall": 0.878698224852071, + "eval_runtime": 0.7986, + "eval_samples_per_second": 234.172, + "eval_steps_per_second": 3.757, + "step": 10388 + }, + { + "epoch": 99.0, + "grad_norm": 0.0006560708279721439, + "learning_rate": 5.000000000000001e-07, + "loss": 0.0004, + "step": 10494 + }, + { + "epoch": 99.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.3574199676513672, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8563218390804598, + "eval_overall_precision": 0.8324022346368715, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.7986, + "eval_samples_per_second": 234.152, + "eval_steps_per_second": 3.756, + "step": 10494 + }, + { + "epoch": 100.0, + "grad_norm": 0.0002968113112729043, + "learning_rate": 0.0, + "loss": 0.0002, + "step": 10600 + }, + { + "epoch": 100.0, + "eval_LOCATION_f1": 0.8965517241379309, + "eval_LOCATION_number": 69, + "eval_LOCATION_precision": 0.8552631578947368, + "eval_LOCATION_recall": 0.9420289855072463, + "eval_ORGANIZATION_f1": 0.7166666666666668, + "eval_ORGANIZATION_number": 58, + "eval_ORGANIZATION_precision": 0.6935483870967742, + "eval_ORGANIZATION_recall": 0.7413793103448276, + "eval_PERSON_f1": 0.9025974025974026, + "eval_PERSON_number": 152, + "eval_PERSON_precision": 0.8910256410256411, + "eval_PERSON_recall": 0.9144736842105263, + "eval_QUANTITY_f1": 0.8387096774193549, + "eval_QUANTITY_number": 30, + "eval_QUANTITY_precision": 0.8125, + "eval_QUANTITY_recall": 0.8666666666666667, + "eval_TIME_f1": 0.8196721311475409, + "eval_TIME_number": 29, + "eval_TIME_precision": 0.78125, + "eval_TIME_recall": 0.8620689655172413, + "eval_loss": 0.35746997594833374, + "eval_overall_accuracy": 0.9638924455825865, + "eval_overall_f1": 0.8563218390804598, + "eval_overall_precision": 0.8324022346368715, + "eval_overall_recall": 0.8816568047337278, + "eval_runtime": 0.8145, + "eval_samples_per_second": 229.593, + "eval_steps_per_second": 3.683, + "step": 10600 + }, + { + "epoch": 100.0, + "step": 10600, + "total_flos": 4488439619319522.0, + "train_loss": 0.00870023393810217, + "train_runtime": 2597.4084, + "train_samples_per_second": 64.949, + "train_steps_per_second": 4.081 } ], "logging_steps": 500, - "max_steps": 2120, + "max_steps": 10600, "num_input_tokens_seen": 0, - "num_train_epochs": 20, + "num_train_epochs": 100, "save_steps": 500, - "total_flos": 896507603456604.0, + "total_flos": 4488439619319522.0, "train_batch_size": 16, "trial_name": null, "trial_params": null