{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.1115612983703613, "learning_rate": 4.9500000000000004e-05, "loss": 0.9255, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012820512820512818, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.25, "eval_PERSON_recall": 0.006578947368421052, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 29, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6139789819717407, "eval_overall_accuracy": 0.8402048655569783, "eval_overall_f1": 0.005847953216374269, "eval_overall_precision": 0.25, "eval_overall_recall": 0.0029585798816568047, "eval_runtime": 0.288, "eval_samples_per_second": 649.255, "eval_steps_per_second": 10.416, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.1083379983901978, "learning_rate": 4.9e-05, "loss": 0.5503, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.09523809523809525, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.26666666666666666, "eval_LOCATION_recall": 0.057971014492753624, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.5272727272727272, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.4887640449438202, "eval_PERSON_recall": 0.5723684210526315, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.4, "eval_TIME_number": 29, "eval_TIME_precision": 0.5625, "eval_TIME_recall": 0.3103448275862069, "eval_loss": 0.3994744122028351, "eval_overall_accuracy": 0.8855313700384123, "eval_overall_f1": 0.35714285714285715, "eval_overall_precision": 0.45045045045045046, "eval_overall_recall": 0.2958579881656805, "eval_runtime": 0.2908, "eval_samples_per_second": 642.974, "eval_steps_per_second": 10.315, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.8157479763031006, "learning_rate": 4.85e-05, "loss": 0.3808, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5454545454545455, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.49411764705882355, "eval_LOCATION_recall": 0.6086956521739131, "eval_ORGANIZATION_f1": 0.2978723404255319, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.3888888888888889, "eval_ORGANIZATION_recall": 0.2413793103448276, "eval_PERSON_f1": 0.735632183908046, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.6530612244897959, "eval_PERSON_recall": 0.8421052631578947, "eval_QUANTITY_f1": 0.28571428571428564, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.2727272727272727, "eval_QUANTITY_recall": 0.3, "eval_TIME_f1": 0.6785714285714286, "eval_TIME_number": 29, "eval_TIME_precision": 0.7037037037037037, "eval_TIME_recall": 0.6551724137931034, "eval_loss": 0.28895071148872375, "eval_overall_accuracy": 0.9267605633802817, "eval_overall_f1": 0.5930069930069929, "eval_overall_precision": 0.5623342175066313, "eval_overall_recall": 0.6272189349112426, "eval_runtime": 0.2887, "eval_samples_per_second": 647.772, "eval_steps_per_second": 10.392, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.4652637243270874, "learning_rate": 4.8e-05, "loss": 0.2833, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6455696202531644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5730337078651685, "eval_LOCATION_recall": 0.7391304347826086, "eval_ORGANIZATION_f1": 0.4642857142857143, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.48148148148148145, "eval_ORGANIZATION_recall": 0.4482758620689655, "eval_PERSON_f1": 0.7904191616766467, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7252747252747253, "eval_PERSON_recall": 0.868421052631579, "eval_QUANTITY_f1": 0.47058823529411764, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.42105263157894735, "eval_QUANTITY_recall": 0.5333333333333333, "eval_TIME_f1": 0.8275862068965517, "eval_TIME_number": 29, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.21562312543392181, "eval_overall_accuracy": 0.9405889884763124, "eval_overall_f1": 0.6821917808219178, "eval_overall_precision": 0.6352040816326531, "eval_overall_recall": 0.7366863905325444, "eval_runtime": 0.2884, "eval_samples_per_second": 648.345, "eval_steps_per_second": 10.401, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.5371237993240356, "learning_rate": 4.75e-05, "loss": 0.2213, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.725, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6373626373626373, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.5263157894736843, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5357142857142857, "eval_ORGANIZATION_recall": 0.5172413793103449, "eval_PERSON_f1": 0.8012048192771084, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7388888888888889, "eval_PERSON_recall": 0.875, "eval_QUANTITY_f1": 0.5333333333333333, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.4444444444444444, "eval_QUANTITY_recall": 0.6666666666666666, "eval_TIME_f1": 0.8275862068965517, "eval_TIME_number": 29, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.18281985819339752, "eval_overall_accuracy": 0.9434058898847631, "eval_overall_f1": 0.7171853856562923, "eval_overall_precision": 0.6608478802992519, "eval_overall_recall": 0.7840236686390533, "eval_runtime": 0.2945, "eval_samples_per_second": 634.984, "eval_steps_per_second": 10.187, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.388359546661377, "learning_rate": 4.7e-05, "loss": 0.1845, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7721518987341773, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6853932584269663, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.5757575757575758, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5135135135135135, "eval_ORGANIZATION_recall": 0.6551724137931034, "eval_PERSON_f1": 0.8192771084337349, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7555555555555555, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.5714285714285715, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.5, "eval_QUANTITY_recall": 0.6666666666666666, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1697721779346466, "eval_overall_accuracy": 0.9467349551856594, "eval_overall_f1": 0.7446808510638298, "eval_overall_precision": 0.6763285024154589, "eval_overall_recall": 0.8284023668639053, "eval_runtime": 0.2919, "eval_samples_per_second": 640.647, "eval_steps_per_second": 10.278, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.574262261390686, "learning_rate": 4.6500000000000005e-05, "loss": 0.17, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6016260162601627, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5692307692307692, "eval_ORGANIZATION_recall": 0.6379310344827587, "eval_PERSON_f1": 0.8246153846153845, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7745664739884393, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1523420363664627, "eval_overall_accuracy": 0.9510883482714468, "eval_overall_f1": 0.7741046831955923, "eval_overall_precision": 0.7242268041237113, "eval_overall_recall": 0.8313609467455622, "eval_runtime": 0.292, "eval_samples_per_second": 640.421, "eval_steps_per_second": 10.274, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.5678428411483765, "learning_rate": 4.600000000000001e-05, "loss": 0.1552, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.8266666666666668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.5891472868217055, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5352112676056338, "eval_ORGANIZATION_recall": 0.6551724137931034, "eval_PERSON_f1": 0.8307692307692307, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7803468208092486, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14812210202217102, "eval_overall_accuracy": 0.9518565941101153, "eval_overall_f1": 0.7759562841530055, "eval_overall_precision": 0.7208121827411168, "eval_overall_recall": 0.8402366863905325, "eval_runtime": 0.2864, "eval_samples_per_second": 652.864, "eval_steps_per_second": 10.474, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.5933927297592163, "learning_rate": 4.55e-05, "loss": 0.1486, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.5853658536585366, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5538461538461539, "eval_ORGANIZATION_recall": 0.6206896551724138, "eval_PERSON_f1": 0.8427672955974843, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8072289156626506, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1388072818517685, "eval_overall_accuracy": 0.9544174135723431, "eval_overall_f1": 0.7860139860139861, "eval_overall_precision": 0.7453580901856764, "eval_overall_recall": 0.8313609467455622, "eval_runtime": 0.2922, "eval_samples_per_second": 640.03, "eval_steps_per_second": 10.268, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.51088547706604, "learning_rate": 4.5e-05, "loss": 0.1369, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6141732283464567, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5652173913043478, "eval_ORGANIZATION_recall": 0.6724137931034483, "eval_PERSON_f1": 0.8348909657320872, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.7928994082840237, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13908080756664276, "eval_overall_accuracy": 0.9549295774647887, "eval_overall_f1": 0.7802197802197802, "eval_overall_precision": 0.7282051282051282, "eval_overall_recall": 0.8402366863905325, "eval_runtime": 0.2918, "eval_samples_per_second": 640.865, "eval_steps_per_second": 10.281, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.4912283420562744, "learning_rate": 4.4500000000000004e-05, "loss": 0.132, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.8456375838926175, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6299212598425198, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5797101449275363, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.8473520249221184, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8047337278106509, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7812500000000001, "eval_TIME_number": 29, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14170250296592712, "eval_overall_accuracy": 0.953393085787452, "eval_overall_f1": 0.7928669410150891, "eval_overall_precision": 0.7391304347826086, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.2921, "eval_samples_per_second": 640.286, "eval_steps_per_second": 10.272, "step": 1166 }, { "epoch": 12.0, "grad_norm": 2.726284980773926, "learning_rate": 4.4000000000000006e-05, "loss": 0.1268, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6140350877192983, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.603448275862069, "eval_PERSON_f1": 0.8517350157728707, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8181818181818182, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.7878787878787877, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13159815967082977, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8016997167138811, "eval_overall_precision": 0.7690217391304348, "eval_overall_recall": 0.8372781065088757, "eval_runtime": 0.2918, "eval_samples_per_second": 640.768, "eval_steps_per_second": 10.28, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.7623488903045654, "learning_rate": 4.35e-05, "loss": 0.1206, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6115702479338844, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5873015873015873, "eval_ORGANIZATION_recall": 0.6379310344827587, "eval_PERSON_f1": 0.8526645768025078, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8143712574850299, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13245752453804016, "eval_overall_accuracy": 0.9574903969270167, "eval_overall_f1": 0.8011204481792716, "eval_overall_precision": 0.7606382978723404, "eval_overall_recall": 0.8461538461538461, "eval_runtime": 0.2913, "eval_samples_per_second": 641.931, "eval_steps_per_second": 10.298, "step": 1378 }, { "epoch": 14.0, "grad_norm": 3.348172664642334, "learning_rate": 4.3e-05, "loss": 0.1186, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7299270072992702, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8500000000000001, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8095238095238095, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13963258266448975, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8158253751705321, "eval_overall_precision": 0.7569620253164557, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2864, "eval_samples_per_second": 652.876, "eval_steps_per_second": 10.474, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.2007865905761719, "learning_rate": 4.25e-05, "loss": 0.1141, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6333333333333333, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6129032258064516, "eval_ORGANIZATION_recall": 0.6551724137931034, "eval_PERSON_f1": 0.8481012658227848, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8170731707317073, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1281883716583252, "eval_overall_accuracy": 0.9582586427656851, "eval_overall_f1": 0.8022598870056498, "eval_overall_precision": 0.7675675675675676, "eval_overall_recall": 0.8402366863905325, "eval_runtime": 0.2866, "eval_samples_per_second": 652.52, "eval_steps_per_second": 10.468, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.8597108721733093, "learning_rate": 4.2e-05, "loss": 0.1083, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7131782945736435, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8526645768025078, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8143712574850299, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7272727272727272, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 29, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1355670541524887, "eval_overall_accuracy": 0.9577464788732394, "eval_overall_f1": 0.8149171270718233, "eval_overall_precision": 0.7642487046632125, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.2918, "eval_samples_per_second": 640.866, "eval_steps_per_second": 10.281, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.9207751154899597, "learning_rate": 4.15e-05, "loss": 0.1106, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6612903225806452, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6212121212121212, "eval_ORGANIZATION_recall": 0.7068965517241379, "eval_PERSON_f1": 0.8517350157728707, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8181818181818182, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 29, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1327420026063919, "eval_overall_accuracy": 0.9585147247119078, "eval_overall_f1": 0.8089260808926082, "eval_overall_precision": 0.7651715039577837, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.2911, "eval_samples_per_second": 642.326, "eval_steps_per_second": 10.305, "step": 1802 }, { "epoch": 18.0, "grad_norm": 2.323946952819824, "learning_rate": 4.1e-05, "loss": 0.1053, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6611570247933884, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6349206349206349, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.8500000000000001, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8095238095238095, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7246376811594204, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 29, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1359253227710724, "eval_overall_accuracy": 0.9580025608194622, "eval_overall_f1": 0.8044382801664354, "eval_overall_precision": 0.7571801566579635, "eval_overall_recall": 0.8579881656804734, "eval_runtime": 0.2865, "eval_samples_per_second": 652.807, "eval_steps_per_second": 10.473, "step": 1908 }, { "epoch": 19.0, "grad_norm": 24.915828704833984, "learning_rate": 4.05e-05, "loss": 0.1089, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8450704225352113, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.584070796460177, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.5689655172413793, "eval_PERSON_f1": 0.8471337579617835, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.875, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.12435611337423325, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8023088023088024, "eval_overall_precision": 0.7830985915492957, "eval_overall_recall": 0.8224852071005917, "eval_runtime": 0.2922, "eval_samples_per_second": 640.081, "eval_steps_per_second": 10.269, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.8912884593009949, "learning_rate": 4e-05, "loss": 0.1046, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.863013698630137, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8181818181818182, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.6779661016949153, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.6896551724137931, "eval_PERSON_f1": 0.85625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.12911909818649292, "eval_overall_accuracy": 0.9600512163892445, "eval_overall_f1": 0.8117977528089887, "eval_overall_precision": 0.7727272727272727, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.2932, "eval_samples_per_second": 637.792, "eval_steps_per_second": 10.232, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.48920294642448425, "learning_rate": 3.9500000000000005e-05, "loss": 0.0965, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.84, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7424242424242424, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6621621621621622, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.875, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9210526315789473, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 29, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1389300525188446, "eval_overall_accuracy": 0.9572343149807938, "eval_overall_f1": 0.8246575342465754, "eval_overall_precision": 0.7678571428571429, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2936, "eval_samples_per_second": 637.017, "eval_steps_per_second": 10.22, "step": 2226 }, { "epoch": 22.0, "grad_norm": 1.2225427627563477, "learning_rate": 3.9000000000000006e-05, "loss": 0.0958, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7633587786259542, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.684931506849315, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8544303797468354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.823170731707317, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1278899759054184, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8328690807799444, "eval_overall_precision": 0.7868421052631579, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2942, "eval_samples_per_second": 635.574, "eval_steps_per_second": 10.196, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.5433982014656067, "learning_rate": 3.85e-05, "loss": 0.0929, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8591549295774648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6499999999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6290322580645161, "eval_ORGANIZATION_recall": 0.6724137931034483, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12278664112091064, "eval_overall_accuracy": 0.9628681177976952, "eval_overall_f1": 0.8176638176638177, "eval_overall_precision": 0.7884615384615384, "eval_overall_recall": 0.849112426035503, "eval_runtime": 0.2929, "eval_samples_per_second": 638.552, "eval_steps_per_second": 10.244, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.4073636531829834, "learning_rate": 3.8e-05, "loss": 0.0934, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.746268656716418, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8509316770186336, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8058823529411765, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8196721311475409, "eval_TIME_number": 29, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13569365441799164, "eval_overall_accuracy": 0.9595390524967989, "eval_overall_f1": 0.8285322359396433, "eval_overall_precision": 0.7723785166240409, "eval_overall_recall": 0.893491124260355, "eval_runtime": 0.2923, "eval_samples_per_second": 639.683, "eval_steps_per_second": 10.262, "step": 2544 }, { "epoch": 25.0, "grad_norm": 2.3010127544403076, "learning_rate": 3.7500000000000003e-05, "loss": 0.0887, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8435374149659864, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7948717948717948, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7166666666666668, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6935483870967742, "eval_ORGANIZATION_recall": 0.7413793103448276, "eval_PERSON_f1": 0.8535031847133758, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8271604938271605, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.12316982448101044, "eval_overall_accuracy": 0.9615877080665813, "eval_overall_f1": 0.8198581560283689, "eval_overall_precision": 0.7874659400544959, "eval_overall_recall": 0.8550295857988166, "eval_runtime": 0.2928, "eval_samples_per_second": 638.601, "eval_steps_per_second": 10.245, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.5638922452926636, "learning_rate": 3.7e-05, "loss": 0.1025, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7716535433070866, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7101449275362319, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1349707692861557, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8312412831241283, "eval_overall_precision": 0.7862796833773087, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2929, "eval_samples_per_second": 638.525, "eval_steps_per_second": 10.244, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.3527199029922485, "learning_rate": 3.65e-05, "loss": 0.0868, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7777777777777778, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7205882352941176, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 29, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1333594173192978, "eval_overall_accuracy": 0.9613316261203585, "eval_overall_f1": 0.8328690807799444, "eval_overall_precision": 0.7868421052631579, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2923, "eval_samples_per_second": 639.845, "eval_steps_per_second": 10.265, "step": 2862 }, { "epoch": 28.0, "grad_norm": 2.2402167320251465, "learning_rate": 3.6e-05, "loss": 0.0836, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7419354838709677, "eval_TIME_number": 29, "eval_TIME_precision": 0.696969696969697, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.1318032443523407, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8212290502793296, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.2923, "eval_samples_per_second": 639.756, "eval_steps_per_second": 10.263, "step": 2968 }, { "epoch": 29.0, "grad_norm": 1.1857041120529175, "learning_rate": 3.55e-05, "loss": 0.0791, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6911764705882353, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.85625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13442517817020416, "eval_overall_accuracy": 0.9618437900128041, "eval_overall_f1": 0.8256624825662484, "eval_overall_precision": 0.7810026385224275, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2926, "eval_samples_per_second": 639.174, "eval_steps_per_second": 10.254, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.6588788032531738, "learning_rate": 3.5e-05, "loss": 0.0792, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6885245901639344, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8643533123028391, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12328661233186722, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8312056737588652, "eval_overall_precision": 0.7983651226158038, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.287, "eval_samples_per_second": 651.586, "eval_steps_per_second": 10.453, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.4727123975753784, "learning_rate": 3.45e-05, "loss": 0.0772, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7317073170731708, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8652037617554859, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8263473053892215, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1277562379837036, "eval_overall_accuracy": 0.9646606914212548, "eval_overall_f1": 0.8326300984528833, "eval_overall_precision": 0.7935656836461126, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2916, "eval_samples_per_second": 641.192, "eval_steps_per_second": 10.287, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.8663144111633301, "learning_rate": 3.4000000000000007e-05, "loss": 0.0766, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8544303797468354, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.823170731707317, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.12748569250106812, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8258426966292135, "eval_overall_precision": 0.786096256684492, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.287, "eval_samples_per_second": 651.573, "eval_steps_per_second": 10.453, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.6088622808456421, "learning_rate": 3.35e-05, "loss": 0.0746, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8507936507936509, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8220858895705522, "eval_PERSON_recall": 0.881578947368421, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13140520453453064, "eval_overall_accuracy": 0.9636363636363636, "eval_overall_f1": 0.8286516853932584, "eval_overall_precision": 0.7887700534759359, "eval_overall_recall": 0.8727810650887574, "eval_runtime": 0.293, "eval_samples_per_second": 638.168, "eval_steps_per_second": 10.238, "step": 3498 }, { "epoch": 34.0, "grad_norm": 1.8929836750030518, "learning_rate": 3.3e-05, "loss": 0.072, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7559055118110236, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6956521739130435, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8626198083067094, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8385093167701864, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13353487849235535, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8366197183098592, "eval_overall_precision": 0.7983870967741935, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.293, "eval_samples_per_second": 638.242, "eval_steps_per_second": 10.239, "step": 3604 }, { "epoch": 35.0, "grad_norm": 1.197149634361267, "learning_rate": 3.2500000000000004e-05, "loss": 0.0712, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7377049180327868, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.703125, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8214285714285714, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13137878477573395, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8347338935574229, "eval_overall_precision": 0.7925531914893617, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2864, "eval_samples_per_second": 652.975, "eval_steps_per_second": 10.476, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.49242687225341797, "learning_rate": 3.2000000000000005e-05, "loss": 0.0702, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7230769230769231, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6527777777777778, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8626198083067094, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8385093167701864, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.8253968253968254, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 29, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13032355904579163, "eval_overall_accuracy": 0.9641485275288092, "eval_overall_f1": 0.8293370944992947, "eval_overall_precision": 0.7924528301886793, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.2939, "eval_samples_per_second": 636.252, "eval_steps_per_second": 10.207, "step": 3816 }, { "epoch": 37.0, "grad_norm": 2.0146589279174805, "learning_rate": 3.15e-05, "loss": 0.0695, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7580645161290323, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7121212121212122, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12965013086795807, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.840620592383639, "eval_overall_precision": 0.8032345013477089, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2929, "eval_samples_per_second": 638.49, "eval_steps_per_second": 10.243, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.8112408518791199, "learning_rate": 3.1e-05, "loss": 0.0674, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7419354838709677, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.696969696969697, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8706624605678233, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1362360268831253, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8363636363636363, "eval_overall_precision": 0.7931034482758621, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2929, "eval_samples_per_second": 638.407, "eval_steps_per_second": 10.242, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.4772998094558716, "learning_rate": 3.05e-05, "loss": 0.0653, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.6942148760330579, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7241379310344828, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.12953267991542816, "eval_overall_accuracy": 0.964404609475032, "eval_overall_f1": 0.8271954674220963, "eval_overall_precision": 0.7934782608695652, "eval_overall_recall": 0.863905325443787, "eval_runtime": 0.2928, "eval_samples_per_second": 638.701, "eval_steps_per_second": 10.247, "step": 4134 }, { "epoch": 40.0, "grad_norm": 1.1962645053863525, "learning_rate": 3e-05, "loss": 0.0637, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8533333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8761904761904762, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13492895662784576, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8330995792426368, "eval_overall_precision": 0.792, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2867, "eval_samples_per_second": 652.21, "eval_steps_per_second": 10.463, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.6804232597351074, "learning_rate": 2.95e-05, "loss": 0.0634, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7058823529411765, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8742138364779874, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.1353294402360916, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8410689170182841, "eval_overall_precision": 0.8016085790884718, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2941, "eval_samples_per_second": 635.842, "eval_steps_per_second": 10.201, "step": 4346 }, { "epoch": 42.0, "grad_norm": 1.3958626985549927, "learning_rate": 2.9e-05, "loss": 0.0622, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7154471544715447, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676923076923077, "eval_ORGANIZATION_recall": 0.7586206896551724, "eval_PERSON_f1": 0.8769716088328074, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13502123951911926, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8377997179125528, "eval_overall_precision": 0.8005390835579514, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2888, "eval_samples_per_second": 647.481, "eval_steps_per_second": 10.387, "step": 4452 }, { "epoch": 43.0, "grad_norm": 1.7736326456069946, "learning_rate": 2.8499999999999998e-05, "loss": 0.0616, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.752, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7014925373134329, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8742138364779874, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1341027021408081, "eval_overall_accuracy": 0.9654289372599232, "eval_overall_f1": 0.8455056179775281, "eval_overall_precision": 0.8048128342245989, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2927, "eval_samples_per_second": 638.914, "eval_steps_per_second": 10.25, "step": 4558 }, { "epoch": 44.0, "grad_norm": 4.0435028076171875, "learning_rate": 2.8000000000000003e-05, "loss": 0.0603, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8476821192052981, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8714733542319749, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8323353293413174, "eval_PERSON_recall": 0.9144736842105263, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14106552302837372, "eval_overall_accuracy": 0.9628681177976952, "eval_overall_f1": 0.8310249307479224, "eval_overall_precision": 0.78125, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.2883, "eval_samples_per_second": 648.632, "eval_steps_per_second": 10.406, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.2470722198486328, "learning_rate": 2.7500000000000004e-05, "loss": 0.0597, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8652037617554859, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8263473053892215, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14016938209533691, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8243430152143846, "eval_overall_precision": 0.7740259740259741, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2928, "eval_samples_per_second": 638.618, "eval_steps_per_second": 10.245, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.7653511762619019, "learning_rate": 2.7000000000000002e-05, "loss": 0.059, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.13417667150497437, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8326300984528833, "eval_overall_precision": 0.7935656836461126, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2925, "eval_samples_per_second": 639.217, "eval_steps_per_second": 10.255, "step": 4876 }, { "epoch": 47.0, "grad_norm": 1.0474615097045898, "learning_rate": 2.6500000000000004e-05, "loss": 0.0574, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7796610169491527, "eval_TIME_number": 29, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.7931034482758621, "eval_loss": 0.13553491234779358, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8258426966292135, "eval_overall_precision": 0.786096256684492, "eval_overall_recall": 0.8698224852071006, "eval_runtime": 0.2928, "eval_samples_per_second": 638.657, "eval_steps_per_second": 10.246, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.1858253479003906, "learning_rate": 2.6000000000000002e-05, "loss": 0.0581, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7377049180327868, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.703125, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13520203530788422, "eval_overall_accuracy": 0.9659411011523688, "eval_overall_f1": 0.8389830508474576, "eval_overall_precision": 0.8027027027027027, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2932, "eval_samples_per_second": 637.868, "eval_steps_per_second": 10.233, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.4307897090911865, "learning_rate": 2.5500000000000003e-05, "loss": 0.0561, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8679245283018868, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8313253012048193, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13861991465091705, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8398876404494382, "eval_overall_precision": 0.7994652406417112, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2889, "eval_samples_per_second": 647.316, "eval_steps_per_second": 10.385, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.8664003014564514, "learning_rate": 2.5e-05, "loss": 0.0544, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.736, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8471337579617835, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.875, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 29, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13451269268989563, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8312056737588652, "eval_overall_precision": 0.7983651226158038, "eval_overall_recall": 0.8668639053254438, "eval_runtime": 0.2869, "eval_samples_per_second": 651.752, "eval_steps_per_second": 10.456, "step": 5300 }, { "epoch": 51.0, "grad_norm": 3.4700815677642822, "learning_rate": 2.45e-05, "loss": 0.0534, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7692307692307692, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6944444444444444, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.847457627118644, "eval_TIME_number": 29, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.13688045740127563, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.841514726507714, "eval_overall_precision": 0.8, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.2922, "eval_samples_per_second": 640.064, "eval_steps_per_second": 10.268, "step": 5406 }, { "epoch": 52.0, "grad_norm": 1.2102717161178589, "learning_rate": 2.4e-05, "loss": 0.0521, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7669172932330827, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.8793103448275862, "eval_PERSON_f1": 0.8643533123028391, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.14608342945575714, "eval_overall_accuracy": 0.9628681177976952, "eval_overall_f1": 0.8337950138504154, "eval_overall_precision": 0.7838541666666666, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2926, "eval_samples_per_second": 639.189, "eval_steps_per_second": 10.254, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.385406732559204, "learning_rate": 2.35e-05, "loss": 0.0524, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.768, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7164179104477612, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1376073956489563, "eval_overall_accuracy": 0.9656850192061459, "eval_overall_f1": 0.8410689170182841, "eval_overall_precision": 0.8016085790884718, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2926, "eval_samples_per_second": 639.014, "eval_steps_per_second": 10.252, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.37542441487312317, "learning_rate": 2.3000000000000003e-05, "loss": 0.0494, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14096996188163757, "eval_overall_accuracy": 0.9659411011523688, "eval_overall_f1": 0.8398876404494382, "eval_overall_precision": 0.7994652406417112, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2945, "eval_samples_per_second": 635.027, "eval_steps_per_second": 10.188, "step": 5724 }, { "epoch": 55.0, "grad_norm": 2.3441622257232666, "learning_rate": 2.25e-05, "loss": 0.0516, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7559055118110236, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6956521739130435, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13822495937347412, "eval_overall_accuracy": 0.9659411011523688, "eval_overall_f1": 0.8455056179775281, "eval_overall_precision": 0.8048128342245989, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2928, "eval_samples_per_second": 638.657, "eval_steps_per_second": 10.246, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.9206390976905823, "learning_rate": 2.2000000000000003e-05, "loss": 0.0497, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7200000000000001, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6716417910447762, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8571428571428571, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8282208588957055, "eval_PERSON_recall": 0.8881578947368421, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.13933928310871124, "eval_overall_accuracy": 0.9654289372599232, "eval_overall_f1": 0.8338028169014083, "eval_overall_precision": 0.7956989247311828, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.293, "eval_samples_per_second": 638.123, "eval_steps_per_second": 10.237, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.8336784839630127, "learning_rate": 2.15e-05, "loss": 0.048, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.752, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.7014925373134329, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14417044818401337, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8347338935574229, "eval_overall_precision": 0.7925531914893617, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2919, "eval_samples_per_second": 640.597, "eval_steps_per_second": 10.277, "step": 6042 }, { "epoch": 58.0, "grad_norm": 1.4807782173156738, "learning_rate": 2.1e-05, "loss": 0.0474, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7480916030534351, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8589341692789968, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8203592814371258, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.14203424751758575, "eval_overall_accuracy": 0.9646606914212548, "eval_overall_f1": 0.8372739916550764, "eval_overall_precision": 0.7900262467191601, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2926, "eval_samples_per_second": 639.123, "eval_steps_per_second": 10.253, "step": 6148 }, { "epoch": 59.0, "grad_norm": 1.1692790985107422, "learning_rate": 2.05e-05, "loss": 0.0447, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6857142857142857, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8643533123028391, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1469813734292984, "eval_overall_accuracy": 0.9646606914212548, "eval_overall_f1": 0.8363636363636363, "eval_overall_precision": 0.7931034482758621, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.293, "eval_samples_per_second": 638.282, "eval_steps_per_second": 10.24, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.8121991157531738, "learning_rate": 2e-05, "loss": 0.045, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8666666666666667, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.14526785910129547, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8330995792426368, "eval_overall_precision": 0.792, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2933, "eval_samples_per_second": 637.529, "eval_steps_per_second": 10.228, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.9558350443840027, "learning_rate": 1.9500000000000003e-05, "loss": 0.0441, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1430891752243042, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8349788434414668, "eval_overall_precision": 0.7978436657681941, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.286, "eval_samples_per_second": 653.776, "eval_steps_per_second": 10.488, "step": 6466 }, { "epoch": 62.0, "grad_norm": 1.2547602653503418, "learning_rate": 1.9e-05, "loss": 0.0474, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1453644037246704, "eval_overall_accuracy": 0.9646606914212548, "eval_overall_f1": 0.8307692307692308, "eval_overall_precision": 0.7877984084880637, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.286, "eval_samples_per_second": 653.787, "eval_steps_per_second": 10.489, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.2882705628871918, "learning_rate": 1.85e-05, "loss": 0.0441, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7258064516129032, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6818181818181818, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8706624605678233, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.14318965375423431, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8382559774964837, "eval_overall_precision": 0.7989276139410187, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2869, "eval_samples_per_second": 651.819, "eval_steps_per_second": 10.457, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.046625018119812, "learning_rate": 1.8e-05, "loss": 0.0449, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8590604026845639, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7034482758620689, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.5862068965517241, "eval_ORGANIZATION_recall": 0.8793103448275862, "eval_PERSON_f1": 0.8598130841121495, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8165680473372781, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.7575757575757577, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.16219820082187653, "eval_overall_accuracy": 0.9590268886043534, "eval_overall_f1": 0.8178137651821863, "eval_overall_precision": 0.7518610421836228, "eval_overall_recall": 0.8964497041420119, "eval_runtime": 0.2859, "eval_samples_per_second": 654.058, "eval_steps_per_second": 10.493, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.8243094682693481, "learning_rate": 1.75e-05, "loss": 0.0452, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7424242424242424, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6621621621621622, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.85625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.14889490604400635, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8349514563106797, "eval_overall_precision": 0.7859007832898173, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2885, "eval_samples_per_second": 648.163, "eval_steps_per_second": 10.398, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.7773322463035583, "learning_rate": 1.7000000000000003e-05, "loss": 0.0418, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7480916030534351, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8214285714285714, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.15430662035942078, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8349514563106797, "eval_overall_precision": 0.7859007832898173, "eval_overall_recall": 0.8905325443786982, "eval_runtime": 0.2923, "eval_samples_per_second": 639.682, "eval_steps_per_second": 10.262, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.9151946306228638, "learning_rate": 1.65e-05, "loss": 0.0421, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7538461538461538, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6805555555555556, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8589341692789968, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8203592814371258, "eval_PERSON_recall": 0.9013157894736842, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.15378881990909576, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8321775312066575, "eval_overall_precision": 0.783289817232376, "eval_overall_recall": 0.8875739644970414, "eval_runtime": 0.2921, "eval_samples_per_second": 640.251, "eval_steps_per_second": 10.271, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.4768742322921753, "learning_rate": 1.6000000000000003e-05, "loss": 0.041, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7518796992481203, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8620689655172413, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.15490765869617462, "eval_overall_accuracy": 0.9626120358514725, "eval_overall_f1": 0.8294036061026352, "eval_overall_precision": 0.7806788511749347, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2858, "eval_samples_per_second": 654.293, "eval_steps_per_second": 10.497, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.6758042573928833, "learning_rate": 1.55e-05, "loss": 0.0411, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8553459119496855, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8192771084337349, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15107131004333496, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8347338935574229, "eval_overall_precision": 0.7925531914893617, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2937, "eval_samples_per_second": 636.611, "eval_steps_per_second": 10.213, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.7515956163406372, "learning_rate": 1.5e-05, "loss": 0.0414, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6764705882352942, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8625, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8214285714285714, "eval_PERSON_recall": 0.9078947368421053, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 29, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8275862068965517, "eval_loss": 0.15384884178638458, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8250000000000001, "eval_overall_precision": 0.7774869109947644, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2872, "eval_samples_per_second": 651.192, "eval_steps_per_second": 10.447, "step": 7420 }, { "epoch": 71.0, "grad_norm": 1.0327603816986084, "learning_rate": 1.45e-05, "loss": 0.0407, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7384615384615385, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1484140008687973, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8375350140056023, "eval_overall_precision": 0.7952127659574468, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2923, "eval_samples_per_second": 639.759, "eval_steps_per_second": 10.264, "step": 7526 }, { "epoch": 72.0, "grad_norm": 1.021155595779419, "learning_rate": 1.4000000000000001e-05, "loss": 0.0395, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8749999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.84, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7419354838709677, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.696969696969697, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.14668720960617065, "eval_overall_accuracy": 0.9649167733674776, "eval_overall_f1": 0.8385269121813032, "eval_overall_precision": 0.8043478260869565, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2936, "eval_samples_per_second": 636.931, "eval_steps_per_second": 10.218, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.8261666893959045, "learning_rate": 1.3500000000000001e-05, "loss": 0.0388, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7441860465116279, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676056338028169, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7936507936507938, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.14678049087524414, "eval_overall_accuracy": 0.9651728553137003, "eval_overall_f1": 0.8387096774193548, "eval_overall_precision": 0.7973333333333333, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2943, "eval_samples_per_second": 635.507, "eval_steps_per_second": 10.195, "step": 7738 }, { "epoch": 74.0, "grad_norm": 1.6623172760009766, "learning_rate": 1.3000000000000001e-05, "loss": 0.0401, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7441860465116279, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676056338028169, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15321803092956543, "eval_overall_accuracy": 0.9646606914212548, "eval_overall_f1": 0.8363636363636363, "eval_overall_precision": 0.7931034482758621, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2923, "eval_samples_per_second": 639.734, "eval_steps_per_second": 10.263, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.745629608631134, "learning_rate": 1.25e-05, "loss": 0.0376, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15535052120685577, "eval_overall_accuracy": 0.9636363636363636, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2924, "eval_samples_per_second": 639.471, "eval_steps_per_second": 10.259, "step": 7950 }, { "epoch": 76.0, "grad_norm": 1.3148008584976196, "learning_rate": 1.2e-05, "loss": 0.0389, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7480916030534351, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15534979104995728, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8328690807799444, "eval_overall_precision": 0.7868421052631579, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2928, "eval_samples_per_second": 638.704, "eval_steps_per_second": 10.247, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.5751745104789734, "learning_rate": 1.1500000000000002e-05, "loss": 0.0385, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7538461538461538, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6805555555555556, "eval_ORGANIZATION_recall": 0.8448275862068966, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1525815725326538, "eval_overall_accuracy": 0.964404609475032, "eval_overall_f1": 0.835195530726257, "eval_overall_precision": 0.791005291005291, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2918, "eval_samples_per_second": 640.799, "eval_steps_per_second": 10.28, "step": 8162 }, { "epoch": 78.0, "grad_norm": 1.434624195098877, "learning_rate": 1.1000000000000001e-05, "loss": 0.0375, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15279057621955872, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2926, "eval_samples_per_second": 639.034, "eval_steps_per_second": 10.252, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.7510130405426025, "learning_rate": 1.05e-05, "loss": 0.0373, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1517334133386612, "eval_overall_accuracy": 0.964404609475032, "eval_overall_f1": 0.8330995792426368, "eval_overall_precision": 0.792, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2862, "eval_samples_per_second": 653.312, "eval_steps_per_second": 10.481, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.686745822429657, "learning_rate": 1e-05, "loss": 0.0375, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7401574803149606, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8553459119496855, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8192771084337349, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15770980715751648, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2918, "eval_samples_per_second": 640.906, "eval_steps_per_second": 10.282, "step": 8480 }, { "epoch": 81.0, "grad_norm": 2.2296547889709473, "learning_rate": 9.5e-06, "loss": 0.0371, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7384615384615385, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1602996438741684, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8317107093184978, "eval_overall_precision": 0.7847769028871391, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2862, "eval_samples_per_second": 653.41, "eval_steps_per_second": 10.483, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.0859251022338867, "learning_rate": 9e-06, "loss": 0.0364, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7441860465116279, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.676056338028169, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15970273315906525, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.8328690807799444, "eval_overall_precision": 0.7868421052631579, "eval_overall_recall": 0.8846153846153846, "eval_runtime": 0.2856, "eval_samples_per_second": 654.808, "eval_steps_per_second": 10.505, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.759631872177124, "learning_rate": 8.500000000000002e-06, "loss": 0.0355, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15819035470485687, "eval_overall_accuracy": 0.963124199743918, "eval_overall_f1": 0.8284518828451882, "eval_overall_precision": 0.783641160949868, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2921, "eval_samples_per_second": 640.257, "eval_steps_per_second": 10.271, "step": 8798 }, { "epoch": 84.0, "grad_norm": 3.2821595668792725, "learning_rate": 8.000000000000001e-06, "loss": 0.0352, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8648648648648648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.810126582278481, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 29, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8620689655172413, "eval_loss": 0.1597450226545334, "eval_overall_accuracy": 0.9620998719590269, "eval_overall_f1": 0.8210818307905687, "eval_overall_precision": 0.7728459530026109, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2916, "eval_samples_per_second": 641.288, "eval_steps_per_second": 10.288, "step": 8904 }, { "epoch": 85.0, "grad_norm": 1.4578148126602173, "learning_rate": 7.5e-06, "loss": 0.0351, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15464067459106445, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8319327731092437, "eval_overall_precision": 0.7898936170212766, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.291, "eval_samples_per_second": 642.532, "eval_steps_per_second": 10.308, "step": 9010 }, { "epoch": 86.0, "grad_norm": 3.6410322189331055, "learning_rate": 7.000000000000001e-06, "loss": 0.0358, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.882758620689655, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8421052631578947, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7131782945736435, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15458884835243225, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8319327731092437, "eval_overall_precision": 0.7898936170212766, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2879, "eval_samples_per_second": 649.619, "eval_steps_per_second": 10.422, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.8341395854949951, "learning_rate": 6.5000000000000004e-06, "loss": 0.0359, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15657885372638702, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8312412831241283, "eval_overall_precision": 0.7862796833773087, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.2923, "eval_samples_per_second": 639.721, "eval_steps_per_second": 10.263, "step": 9222 }, { "epoch": 88.0, "grad_norm": 2.221242904663086, "learning_rate": 6e-06, "loss": 0.0338, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7086614173228347, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6521739130434783, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15500542521476746, "eval_overall_accuracy": 0.9641485275288092, "eval_overall_f1": 0.8302945301542777, "eval_overall_precision": 0.7893333333333333, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2854, "eval_samples_per_second": 655.275, "eval_steps_per_second": 10.512, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.7178964018821716, "learning_rate": 5.500000000000001e-06, "loss": 0.0324, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.703125, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15786349773406982, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.8256624825662484, "eval_overall_precision": 0.7810026385224275, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2857, "eval_samples_per_second": 654.47, "eval_steps_per_second": 10.5, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.6527904272079468, "learning_rate": 5e-06, "loss": 0.034, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15783792734146118, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8268156424581006, "eval_overall_precision": 0.783068783068783, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2925, "eval_samples_per_second": 639.316, "eval_steps_per_second": 10.256, "step": 9540 }, { "epoch": 91.0, "grad_norm": 1.0714702606201172, "learning_rate": 4.5e-06, "loss": 0.0353, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15797153115272522, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.286, "eval_samples_per_second": 653.836, "eval_steps_per_second": 10.489, "step": 9646 }, { "epoch": 92.0, "grad_norm": 1.2929750680923462, "learning_rate": 4.000000000000001e-06, "loss": 0.0325, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15651264786720276, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8307692307692308, "eval_overall_precision": 0.7877984084880637, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2929, "eval_samples_per_second": 638.474, "eval_steps_per_second": 10.243, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.8345323801040649, "learning_rate": 3.5000000000000004e-06, "loss": 0.0344, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1590217500925064, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8284518828451882, "eval_overall_precision": 0.783641160949868, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2919, "eval_samples_per_second": 640.648, "eval_steps_per_second": 10.278, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.6701174974441528, "learning_rate": 3e-06, "loss": 0.0336, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8571428571428572, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8076923076923077, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7286821705426356, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7500000000000001, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1604832261800766, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.8256624825662484, "eval_overall_precision": 0.7810026385224275, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2864, "eval_samples_per_second": 652.822, "eval_steps_per_second": 10.473, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.5713714361190796, "learning_rate": 2.5e-06, "loss": 0.0337, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.16034719347953796, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.829608938547486, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2857, "eval_samples_per_second": 654.607, "eval_steps_per_second": 10.502, "step": 10070 }, { "epoch": 96.0, "grad_norm": 1.4332071542739868, "learning_rate": 2.0000000000000003e-06, "loss": 0.0326, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.703125, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6428571428571429, "eval_ORGANIZATION_recall": 0.7758620689655172, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1593874990940094, "eval_overall_accuracy": 0.9633802816901409, "eval_overall_f1": 0.8256624825662484, "eval_overall_precision": 0.7810026385224275, "eval_overall_recall": 0.8757396449704142, "eval_runtime": 0.2921, "eval_samples_per_second": 640.143, "eval_steps_per_second": 10.27, "step": 10176 }, { "epoch": 97.0, "grad_norm": 1.3420923948287964, "learning_rate": 1.5e-06, "loss": 0.0352, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7244094488188977, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7931034482758621, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8333333333333334, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15942679345607758, "eval_overall_accuracy": 0.9641485275288092, "eval_overall_f1": 0.8307692307692308, "eval_overall_precision": 0.7877984084880637, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2927, "eval_samples_per_second": 638.801, "eval_steps_per_second": 10.248, "step": 10282 }, { "epoch": 98.0, "grad_norm": 2.652052402496338, "learning_rate": 1.0000000000000002e-06, "loss": 0.0329, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8767123287671235, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8311688311688312, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1578895002603531, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8307692307692308, "eval_overall_precision": 0.7877984084880637, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2858, "eval_samples_per_second": 654.385, "eval_steps_per_second": 10.498, "step": 10388 }, { "epoch": 99.0, "grad_norm": 1.3167122602462769, "learning_rate": 5.000000000000001e-07, "loss": 0.0321, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6857142857142857, "eval_ORGANIZATION_recall": 0.8275862068965517, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.15904921293258667, "eval_overall_accuracy": 0.9641485275288092, "eval_overall_f1": 0.8324022346368716, "eval_overall_precision": 0.7883597883597884, "eval_overall_recall": 0.8816568047337278, "eval_runtime": 0.293, "eval_samples_per_second": 638.168, "eval_steps_per_second": 10.238, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.26482483744621277, "learning_rate": 0.0, "loss": 0.0322, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.870748299319728, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8205128205128205, "eval_LOCATION_recall": 0.927536231884058, "eval_ORGANIZATION_f1": 0.7343749999999999, "eval_ORGANIZATION_number": 58, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.8103448275862069, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 152, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.8947368421052632, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 30, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 29, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.896551724137931, "eval_loss": 0.1596968173980713, "eval_overall_accuracy": 0.9638924455825865, "eval_overall_f1": 0.8284518828451882, "eval_overall_precision": 0.783641160949868, "eval_overall_recall": 0.878698224852071, "eval_runtime": 0.2913, "eval_samples_per_second": 641.846, "eval_steps_per_second": 10.297, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 4535639530574946.0, "train_loss": 0.08503569045156803, "train_runtime": 606.7172, "train_samples_per_second": 278.054, "train_steps_per_second": 17.471 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4535639530574946.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }