{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.5824520587921143, "learning_rate": 4.9500000000000004e-05, "loss": 0.9315, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012987012987012988, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.25, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 34, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6119179725646973, "eval_overall_accuracy": 0.8370662072360325, "eval_overall_f1": 0.005633802816901409, "eval_overall_precision": 0.25, "eval_overall_recall": 0.002849002849002849, "eval_runtime": 0.3369, "eval_samples_per_second": 555.024, "eval_steps_per_second": 8.904, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.5226932764053345, "learning_rate": 4.9e-05, "loss": 0.5353, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.40983606557377056, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.5102040816326531, "eval_LOCATION_recall": 0.3424657534246575, "eval_ORGANIZATION_f1": 0.08695652173913043, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.1, "eval_ORGANIZATION_recall": 0.07692307692307693, "eval_PERSON_f1": 0.574468085106383, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.4778761061946903, "eval_PERSON_recall": 0.72, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.5483870967741935, "eval_TIME_number": 34, "eval_TIME_precision": 0.6071428571428571, "eval_TIME_recall": 0.5, "eval_loss": 0.411459743976593, "eval_overall_accuracy": 0.8924440068914595, "eval_overall_f1": 0.4397163120567376, "eval_overall_precision": 0.4378531073446328, "eval_overall_recall": 0.4415954415954416, "eval_runtime": 0.3252, "eval_samples_per_second": 574.99, "eval_steps_per_second": 9.224, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.2673431634902954, "learning_rate": 4.85e-05, "loss": 0.3686, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5747126436781609, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.49504950495049505, "eval_LOCATION_recall": 0.684931506849315, "eval_ORGANIZATION_f1": 0.45528455284552843, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.4827586206896552, "eval_ORGANIZATION_recall": 0.4307692307692308, "eval_PERSON_f1": 0.7507163323782233, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.6582914572864321, "eval_PERSON_recall": 0.8733333333333333, "eval_QUANTITY_f1": 0.3934426229508197, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.375, "eval_QUANTITY_recall": 0.41379310344827586, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 34, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8235294117647058, "eval_loss": 0.29026341438293457, "eval_overall_accuracy": 0.9288702928870293, "eval_overall_f1": 0.6417525773195876, "eval_overall_precision": 0.5858823529411765, "eval_overall_recall": 0.7094017094017094, "eval_runtime": 0.3326, "eval_samples_per_second": 562.209, "eval_steps_per_second": 9.019, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.4100310802459717, "learning_rate": 4.8e-05, "loss": 0.2668, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.5664739884393063, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.49, "eval_LOCATION_recall": 0.6712328767123288, "eval_ORGANIZATION_f1": 0.4878048780487805, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5172413793103449, "eval_ORGANIZATION_recall": 0.46153846153846156, "eval_PERSON_f1": 0.8246153846153845, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7657142857142857, "eval_PERSON_recall": 0.8933333333333333, "eval_QUANTITY_f1": 0.5245901639344263, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5, "eval_QUANTITY_recall": 0.5517241379310345, "eval_TIME_f1": 0.8823529411764706, "eval_TIME_number": 34, "eval_TIME_precision": 0.8823529411764706, "eval_TIME_recall": 0.8823529411764706, "eval_loss": 0.207948699593544, "eval_overall_accuracy": 0.9401919763721388, "eval_overall_f1": 0.6906666666666667, "eval_overall_precision": 0.6491228070175439, "eval_overall_recall": 0.7378917378917379, "eval_runtime": 0.3333, "eval_samples_per_second": 560.99, "eval_steps_per_second": 9.0, "step": 424 }, { "epoch": 5.0, "grad_norm": 2.0687103271484375, "learning_rate": 4.75e-05, "loss": 0.2091, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7195121951219512, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6483516483516484, "eval_LOCATION_recall": 0.8082191780821918, "eval_ORGANIZATION_f1": 0.5714285714285715, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5588235294117647, "eval_ORGANIZATION_recall": 0.5846153846153846, "eval_PERSON_f1": 0.8369230769230769, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7771428571428571, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.5846153846153845, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5277777777777778, "eval_QUANTITY_recall": 0.6551724137931034, "eval_TIME_f1": 0.8333333333333333, "eval_TIME_number": 34, "eval_TIME_precision": 0.7894736842105263, "eval_TIME_recall": 0.8823529411764706, "eval_loss": 0.17728105187416077, "eval_overall_accuracy": 0.9451144474526212, "eval_overall_f1": 0.7430830039525692, "eval_overall_precision": 0.6911764705882353, "eval_overall_recall": 0.8034188034188035, "eval_runtime": 0.3284, "eval_samples_per_second": 569.476, "eval_steps_per_second": 9.136, "step": 530 }, { "epoch": 6.0, "grad_norm": 2.4117839336395264, "learning_rate": 4.7e-05, "loss": 0.1833, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.6971428571428572, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.5980392156862745, "eval_LOCATION_recall": 0.8356164383561644, "eval_ORGANIZATION_f1": 0.5818181818181819, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.48, "eval_ORGANIZATION_recall": 0.7384615384615385, "eval_PERSON_f1": 0.8353658536585366, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7696629213483146, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.5555555555555556, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.46511627906976744, "eval_QUANTITY_recall": 0.6896551724137931, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.189751997590065, "eval_overall_accuracy": 0.9424070883583558, "eval_overall_f1": 0.7248157248157246, "eval_overall_precision": 0.6371490280777538, "eval_overall_recall": 0.8404558404558404, "eval_runtime": 0.3281, "eval_samples_per_second": 569.94, "eval_steps_per_second": 9.143, "step": 636 }, { "epoch": 7.0, "grad_norm": 1.2822880744934082, "learning_rate": 4.6500000000000005e-05, "loss": 0.1653, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7607361963190183, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6888888888888889, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.5857142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5466666666666666, "eval_ORGANIZATION_recall": 0.6307692307692307, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5945945945945946, "eval_QUANTITY_recall": 0.7586206896551724, "eval_TIME_f1": 0.8450704225352113, "eval_TIME_number": 34, "eval_TIME_precision": 0.8108108108108109, "eval_TIME_recall": 0.8823529411764706, "eval_loss": 0.15423187613487244, "eval_overall_accuracy": 0.9512675363032242, "eval_overall_f1": 0.770448548812665, "eval_overall_precision": 0.7174447174447175, "eval_overall_recall": 0.8319088319088319, "eval_runtime": 0.3338, "eval_samples_per_second": 560.152, "eval_steps_per_second": 8.986, "step": 742 }, { "epoch": 8.0, "grad_norm": 1.469247817993164, "learning_rate": 4.600000000000001e-05, "loss": 0.1529, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7590361445783131, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6774193548387096, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.5915492957746479, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5454545454545454, "eval_ORGANIZATION_recall": 0.6461538461538462, "eval_PERSON_f1": 0.8500000000000001, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7619047619047619, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.7058823529411765, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.861111111111111, "eval_TIME_number": 34, "eval_TIME_precision": 0.8157894736842105, "eval_TIME_recall": 0.9117647058823529, "eval_loss": 0.14763768017292023, "eval_overall_accuracy": 0.9527442776273689, "eval_overall_f1": 0.7758846657929228, "eval_overall_precision": 0.7184466019417476, "eval_overall_recall": 0.8433048433048433, "eval_runtime": 0.3346, "eval_samples_per_second": 558.898, "eval_steps_per_second": 8.966, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.5628341436386108, "learning_rate": 4.55e-05, "loss": 0.1428, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7544910179640719, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6702127659574468, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6225165562913907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5465116279069767, "eval_ORGANIZATION_recall": 0.7230769230769231, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.575, "eval_QUANTITY_recall": 0.7931034482758621, "eval_TIME_f1": 0.8266666666666665, "eval_TIME_number": 34, "eval_TIME_precision": 0.7560975609756098, "eval_TIME_recall": 0.9117647058823529, "eval_loss": 0.14981509745121002, "eval_overall_accuracy": 0.9497907949790795, "eval_overall_f1": 0.7789203084832904, "eval_overall_precision": 0.7096018735362998, "eval_overall_recall": 0.8632478632478633, "eval_runtime": 0.3338, "eval_samples_per_second": 560.163, "eval_steps_per_second": 8.987, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.2276618480682373, "learning_rate": 4.5e-05, "loss": 0.132, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.779874213836478, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7209302325581395, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.5925925925925927, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5714285714285714, "eval_ORGANIZATION_recall": 0.6153846153846154, "eval_PERSON_f1": 0.8616352201257862, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8154761904761905, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8108108108108107, "eval_TIME_number": 34, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8823529411764706, "eval_loss": 0.14296573400497437, "eval_overall_accuracy": 0.9532365247354172, "eval_overall_f1": 0.7808764940239045, "eval_overall_precision": 0.7313432835820896, "eval_overall_recall": 0.8376068376068376, "eval_runtime": 0.3274, "eval_samples_per_second": 571.224, "eval_steps_per_second": 9.164, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.8262553215026855, "learning_rate": 4.4500000000000004e-05, "loss": 0.1288, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7515151515151515, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6739130434782609, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.6330935251798562, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5945945945945946, "eval_ORGANIZATION_recall": 0.676923076923077, "eval_PERSON_f1": 0.8698412698412699, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8303030303030303, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7631578947368423, "eval_TIME_number": 34, "eval_TIME_precision": 0.6904761904761905, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1460973471403122, "eval_overall_accuracy": 0.9515136598572483, "eval_overall_f1": 0.774869109947644, "eval_overall_precision": 0.7167070217917676, "eval_overall_recall": 0.8433048433048433, "eval_runtime": 0.3342, "eval_samples_per_second": 559.473, "eval_steps_per_second": 8.976, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.1676838397979736, "learning_rate": 4.4000000000000006e-05, "loss": 0.1219, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7590361445783131, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.6774193548387096, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6433566433566433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5897435897435898, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.8734177215189873, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8313253012048193, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7631578947368423, "eval_TIME_number": 34, "eval_TIME_precision": 0.6904761904761905, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14986908435821533, "eval_overall_accuracy": 0.9502830420871278, "eval_overall_f1": 0.7802340702210663, "eval_overall_precision": 0.7177033492822966, "eval_overall_recall": 0.8547008547008547, "eval_runtime": 0.333, "eval_samples_per_second": 561.614, "eval_steps_per_second": 9.01, "step": 1272 }, { "epoch": 13.0, "grad_norm": 1.25841224193573, "learning_rate": 4.35e-05, "loss": 0.1176, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7820512820512822, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8356164383561644, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5975609756097561, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13805125653743744, "eval_overall_accuracy": 0.9547132660595619, "eval_overall_f1": 0.7968337730870712, "eval_overall_precision": 0.742014742014742, "eval_overall_recall": 0.8603988603988604, "eval_runtime": 0.3326, "eval_samples_per_second": 562.243, "eval_steps_per_second": 9.02, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.1619478464126587, "learning_rate": 4.3e-05, "loss": 0.1161, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.782608695652174, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7159090909090909, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5975609756097561, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8761904761904761, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7536231884057972, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.896551724137931, "eval_TIME_f1": 0.7631578947368423, "eval_TIME_number": 34, "eval_TIME_precision": 0.6904761904761905, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14077436923980713, "eval_overall_accuracy": 0.9532365247354172, "eval_overall_f1": 0.7942708333333333, "eval_overall_precision": 0.7314148681055156, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.3264, "eval_samples_per_second": 572.885, "eval_steps_per_second": 9.191, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.547819972038269, "learning_rate": 4.25e-05, "loss": 0.1148, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7777777777777778, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7078651685393258, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7058823529411765, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1482475847005844, "eval_overall_accuracy": 0.9537287718434654, "eval_overall_f1": 0.7968952134540751, "eval_overall_precision": 0.7298578199052133, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3273, "eval_samples_per_second": 571.301, "eval_steps_per_second": 9.165, "step": 1590 }, { "epoch": 16.0, "grad_norm": 3.2295055389404297, "learning_rate": 4.2e-05, "loss": 0.1075, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6268656716417911, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6086956521739131, "eval_ORGANIZATION_recall": 0.6461538461538462, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7142857142857144, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6097560975609756, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14014115929603577, "eval_overall_accuracy": 0.9554516367216342, "eval_overall_f1": 0.7914438502673797, "eval_overall_precision": 0.7455919395465995, "eval_overall_recall": 0.8433048433048433, "eval_runtime": 0.3353, "eval_samples_per_second": 557.692, "eval_steps_per_second": 8.947, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.9571211934089661, "learning_rate": 4.15e-05, "loss": 0.1058, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7875, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7199999999999999, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8761904761904761, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7631578947368423, "eval_TIME_number": 34, "eval_TIME_precision": 0.6904761904761905, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14074338972568512, "eval_overall_accuracy": 0.9542210189515137, "eval_overall_f1": 0.8057366362451107, "eval_overall_precision": 0.7427884615384616, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3268, "eval_samples_per_second": 572.193, "eval_steps_per_second": 9.18, "step": 1802 }, { "epoch": 18.0, "grad_norm": 1.2484526634216309, "learning_rate": 4.1e-05, "loss": 0.1021, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6433566433566433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5897435897435898, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13723434507846832, "eval_overall_accuracy": 0.9561900073837066, "eval_overall_f1": 0.7936507936507937, "eval_overall_precision": 0.7407407407407407, "eval_overall_recall": 0.8547008547008547, "eval_runtime": 0.3273, "eval_samples_per_second": 571.38, "eval_steps_per_second": 9.167, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.977418839931488, "learning_rate": 4.05e-05, "loss": 0.1032, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8356164383561644, "eval_ORGANIZATION_f1": 0.7066666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7812500000000001, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13176140189170837, "eval_overall_accuracy": 0.958897366477972, "eval_overall_f1": 0.8116710875331565, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3289, "eval_samples_per_second": 568.639, "eval_steps_per_second": 9.123, "step": 2014 }, { "epoch": 20.0, "grad_norm": 1.2055819034576416, "learning_rate": 4e-05, "loss": 0.0979, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7974683544303799, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1400451809167862, "eval_overall_accuracy": 0.956928378045779, "eval_overall_f1": 0.8132450331125828, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3266, "eval_samples_per_second": 572.647, "eval_steps_per_second": 9.187, "step": 2120 }, { "epoch": 21.0, "grad_norm": 2.198835611343384, "learning_rate": 3.9500000000000005e-05, "loss": 0.098, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8181818181818182, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.725925925925926, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13511410355567932, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8194070080862534, "eval_overall_precision": 0.7774936061381074, "eval_overall_recall": 0.8660968660968661, "eval_runtime": 0.3268, "eval_samples_per_second": 572.204, "eval_steps_per_second": 9.18, "step": 2226 }, { "epoch": 22.0, "grad_norm": 3.7243123054504395, "learning_rate": 3.9000000000000006e-05, "loss": 0.0942, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7820512820512822, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8356164383561644, "eval_ORGANIZATION_f1": 0.7027027027027027, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6265060240963856, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1375378519296646, "eval_overall_accuracy": 0.9574206251538272, "eval_overall_f1": 0.8085106382978723, "eval_overall_precision": 0.7581047381546134, "eval_overall_recall": 0.8660968660968661, "eval_runtime": 0.3271, "eval_samples_per_second": 571.696, "eval_steps_per_second": 9.172, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.6769466400146484, "learning_rate": 3.85e-05, "loss": 0.0943, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13511058688163757, "eval_overall_accuracy": 0.9591434900319961, "eval_overall_f1": 0.8249336870026525, "eval_overall_precision": 0.771712158808933, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3273, "eval_samples_per_second": 571.272, "eval_steps_per_second": 9.165, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.9959501028060913, "learning_rate": 3.8e-05, "loss": 0.091, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.8050314465408805, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7441860465116279, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14082586765289307, "eval_overall_accuracy": 0.9579128722618755, "eval_overall_f1": 0.8183006535947712, "eval_overall_precision": 0.7560386473429952, "eval_overall_recall": 0.8917378917378918, "eval_runtime": 0.3276, "eval_samples_per_second": 570.878, "eval_steps_per_second": 9.158, "step": 2544 }, { "epoch": 25.0, "grad_norm": 2.225444793701172, "learning_rate": 3.7500000000000003e-05, "loss": 0.089, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1414780169725418, "eval_overall_accuracy": 0.9584051193699237, "eval_overall_f1": 0.8186666666666667, "eval_overall_precision": 0.7694235588972431, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3266, "eval_samples_per_second": 572.607, "eval_steps_per_second": 9.186, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.2359886169433594, "learning_rate": 3.7e-05, "loss": 0.0862, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7898089171974523, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.7194244604316546, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6756756756756757, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7142857142857144, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6097560975609756, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14282022416591644, "eval_overall_accuracy": 0.9561900073837066, "eval_overall_f1": 0.8052980132450331, "eval_overall_precision": 0.7524752475247525, "eval_overall_recall": 0.8660968660968661, "eval_runtime": 0.3275, "eval_samples_per_second": 570.999, "eval_steps_per_second": 9.16, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.0968230962753296, "learning_rate": 3.65e-05, "loss": 0.0836, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7950310559006212, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7272727272727273, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.676056338028169, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14485140144824982, "eval_overall_accuracy": 0.9556977602756583, "eval_overall_f1": 0.8068331143232589, "eval_overall_precision": 0.748780487804878, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3284, "eval_samples_per_second": 569.433, "eval_steps_per_second": 9.135, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.7558865547180176, "learning_rate": 3.6e-05, "loss": 0.0801, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.7338129496402878, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6891891891891891, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13724297285079956, "eval_overall_accuracy": 0.9579128722618755, "eval_overall_f1": 0.8156123822341856, "eval_overall_precision": 0.7729591836734694, "eval_overall_recall": 0.8632478632478633, "eval_runtime": 0.3346, "eval_samples_per_second": 558.811, "eval_steps_per_second": 8.965, "step": 2968 }, { "epoch": 29.0, "grad_norm": 1.0294597148895264, "learning_rate": 3.55e-05, "loss": 0.0779, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7974683544303799, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1392383724451065, "eval_overall_accuracy": 0.958897366477972, "eval_overall_f1": 0.8236842105263158, "eval_overall_precision": 0.7652811735941321, "eval_overall_recall": 0.8917378917378918, "eval_runtime": 0.3338, "eval_samples_per_second": 560.248, "eval_steps_per_second": 8.988, "step": 3074 }, { "epoch": 30.0, "grad_norm": 1.9617377519607544, "learning_rate": 3.5e-05, "loss": 0.0776, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.725925925925926, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.7538461538461538, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13599379360675812, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8236877523553163, "eval_overall_precision": 0.7806122448979592, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.332, "eval_samples_per_second": 563.281, "eval_steps_per_second": 9.037, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.6533139944076538, "learning_rate": 3.45e-05, "loss": 0.0764, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8101265822784809, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14058609306812286, "eval_overall_accuracy": 0.9598818606940684, "eval_overall_f1": 0.8173455978975033, "eval_overall_precision": 0.7585365853658537, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3334, "eval_samples_per_second": 560.883, "eval_steps_per_second": 8.998, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.820826530456543, "learning_rate": 3.4000000000000007e-05, "loss": 0.0745, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7974683544303799, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6857142857142856, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1464959979057312, "eval_overall_accuracy": 0.9576667487078513, "eval_overall_f1": 0.8157894736842105, "eval_overall_precision": 0.7579462102689487, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3329, "eval_samples_per_second": 561.647, "eval_steps_per_second": 9.01, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.9249401688575745, "learning_rate": 3.35e-05, "loss": 0.0729, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.72992700729927, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6944444444444444, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7936507936507937, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13697849214076996, "eval_overall_accuracy": 0.9606202313561408, "eval_overall_f1": 0.8243243243243243, "eval_overall_precision": 0.7840616966580977, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.3343, "eval_samples_per_second": 559.37, "eval_steps_per_second": 8.974, "step": 3498 }, { "epoch": 34.0, "grad_norm": 3.431596040725708, "learning_rate": 3.3e-05, "loss": 0.0719, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.6814814814814816, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7812500000000001, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1357881724834442, "eval_overall_accuracy": 0.9616047255722373, "eval_overall_f1": 0.819047619047619, "eval_overall_precision": 0.7838541666666666, "eval_overall_recall": 0.8575498575498576, "eval_runtime": 0.3327, "eval_samples_per_second": 562.136, "eval_steps_per_second": 9.018, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.9399017691612244, "learning_rate": 3.2500000000000004e-05, "loss": 0.0746, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8050314465408805, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7441860465116279, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7733333333333334, "eval_TIME_number": 34, "eval_TIME_precision": 0.7073170731707317, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14653536677360535, "eval_overall_accuracy": 0.9574206251538272, "eval_overall_f1": 0.8141361256544503, "eval_overall_precision": 0.7530266343825666, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3328, "eval_samples_per_second": 561.886, "eval_steps_per_second": 9.014, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.6335604190826416, "learning_rate": 3.2000000000000005e-05, "loss": 0.0676, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13876868784427643, "eval_overall_accuracy": 0.9603741078021166, "eval_overall_f1": 0.8251001335113485, "eval_overall_precision": 0.7763819095477387, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3328, "eval_samples_per_second": 561.873, "eval_steps_per_second": 9.014, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.0286895036697388, "learning_rate": 3.15e-05, "loss": 0.0674, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8761904761904761, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8363636363636363, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14836791157722473, "eval_overall_accuracy": 0.9586512429239479, "eval_overall_f1": 0.8131578947368421, "eval_overall_precision": 0.7555012224938875, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3338, "eval_samples_per_second": 560.202, "eval_steps_per_second": 8.987, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.754433274269104, "learning_rate": 3.1e-05, "loss": 0.0653, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.6911764705882353, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6619718309859155, "eval_ORGANIZATION_recall": 0.7230769230769231, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1401306837797165, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8096514745308312, "eval_overall_precision": 0.7645569620253164, "eval_overall_recall": 0.8603988603988604, "eval_runtime": 0.3326, "eval_samples_per_second": 562.239, "eval_steps_per_second": 9.02, "step": 4028 }, { "epoch": 39.0, "grad_norm": 1.2110971212387085, "learning_rate": 3.05e-05, "loss": 0.0638, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1372911036014557, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.8229027962716379, "eval_overall_precision": 0.7725, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.332, "eval_samples_per_second": 563.249, "eval_steps_per_second": 9.036, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.7484323382377625, "learning_rate": 3e-05, "loss": 0.0641, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7875, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7241379310344828, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6857142857142856, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15354810655117035, "eval_overall_accuracy": 0.9566822544917548, "eval_overall_f1": 0.8098958333333335, "eval_overall_precision": 0.7458033573141487, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3264, "eval_samples_per_second": 572.882, "eval_steps_per_second": 9.191, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.8354088068008423, "learning_rate": 2.95e-05, "loss": 0.0632, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7801418439716312, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7236842105263158, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.13777735829353333, "eval_overall_accuracy": 0.9613586020182131, "eval_overall_f1": 0.8326639892904953, "eval_overall_precision": 0.7853535353535354, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.333, "eval_samples_per_second": 561.553, "eval_steps_per_second": 9.009, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.5027186274528503, "learning_rate": 2.9e-05, "loss": 0.0607, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8493150684931506, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1403217911720276, "eval_overall_accuracy": 0.9606202313561408, "eval_overall_f1": 0.8192771084337349, "eval_overall_precision": 0.7727272727272727, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3336, "eval_samples_per_second": 560.597, "eval_steps_per_second": 8.994, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.9568884968757629, "learning_rate": 2.8499999999999998e-05, "loss": 0.0596, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1430799663066864, "eval_overall_accuracy": 0.9616047255722373, "eval_overall_f1": 0.8230563002680965, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3331, "eval_samples_per_second": 561.433, "eval_steps_per_second": 9.007, "step": 4558 }, { "epoch": 44.0, "grad_norm": 5.6017351150512695, "learning_rate": 2.8000000000000003e-05, "loss": 0.0582, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6842105263157895, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.7837837837837837, "eval_TIME_number": 34, "eval_TIME_precision": 0.725, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14417453110218048, "eval_overall_accuracy": 0.961112478464189, "eval_overall_f1": 0.8229027962716379, "eval_overall_precision": 0.7725, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3257, "eval_samples_per_second": 574.07, "eval_steps_per_second": 9.21, "step": 4664 }, { "epoch": 45.0, "grad_norm": 2.356386184692383, "learning_rate": 2.7500000000000004e-05, "loss": 0.0606, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14679183065891266, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8232189973614775, "eval_overall_precision": 0.7665847665847666, "eval_overall_recall": 0.8888888888888888, "eval_runtime": 0.3259, "eval_samples_per_second": 573.862, "eval_steps_per_second": 9.206, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.9929021000862122, "learning_rate": 2.7000000000000002e-05, "loss": 0.0563, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7285714285714285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14097212255001068, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7752525252525253, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.333, "eval_samples_per_second": 561.632, "eval_steps_per_second": 9.01, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.8276335597038269, "learning_rate": 2.6500000000000004e-05, "loss": 0.0556, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7974683544303799, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7411764705882353, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7724137931034483, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6857142857142856, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15497690439224243, "eval_overall_accuracy": 0.9579128722618755, "eval_overall_f1": 0.8173455978975033, "eval_overall_precision": 0.7585365853658537, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3319, "eval_samples_per_second": 563.4, "eval_steps_per_second": 9.039, "step": 4982 }, { "epoch": 48.0, "grad_norm": 2.3347344398498535, "learning_rate": 2.6000000000000002e-05, "loss": 0.0578, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.7945205479452054, "eval_TIME_number": 34, "eval_TIME_precision": 0.7435897435897436, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1532071828842163, "eval_overall_accuracy": 0.9576667487078513, "eval_overall_f1": 0.8184210526315789, "eval_overall_precision": 0.7603911980440098, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.332, "eval_samples_per_second": 563.241, "eval_steps_per_second": 9.036, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.38269466161727905, "learning_rate": 2.5500000000000003e-05, "loss": 0.0559, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7428571428571429, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6933333333333334, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14444759488105774, "eval_overall_accuracy": 0.9618508491262614, "eval_overall_f1": 0.8262032085561498, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.332, "eval_samples_per_second": 563.256, "eval_steps_per_second": 9.036, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.5551215410232544, "learning_rate": 2.5e-05, "loss": 0.0544, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.757142857142857, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7066666666666667, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1467483639717102, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.8266666666666667, "eval_overall_precision": 0.7769423558897243, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3328, "eval_samples_per_second": 561.888, "eval_steps_per_second": 9.014, "step": 5300 }, { "epoch": 51.0, "grad_norm": 1.1728203296661377, "learning_rate": 2.45e-05, "loss": 0.0511, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7246376811594203, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.684931506849315, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14386440813541412, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7752525252525253, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3262, "eval_samples_per_second": 573.233, "eval_steps_per_second": 9.196, "step": 5406 }, { "epoch": 52.0, "grad_norm": 1.3139925003051758, "learning_rate": 2.4e-05, "loss": 0.0516, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8734177215189873, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8313253012048193, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15267647802829742, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8221343873517786, "eval_overall_precision": 0.7647058823529411, "eval_overall_recall": 0.8888888888888888, "eval_runtime": 0.3328, "eval_samples_per_second": 561.953, "eval_steps_per_second": 9.015, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.7045568227767944, "learning_rate": 2.35e-05, "loss": 0.0524, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8742138364779874, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8273809523809523, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15286701917648315, "eval_overall_accuracy": 0.9598818606940684, "eval_overall_f1": 0.8194993412384717, "eval_overall_precision": 0.7622549019607843, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3345, "eval_samples_per_second": 559.086, "eval_steps_per_second": 8.969, "step": 5618 }, { "epoch": 54.0, "grad_norm": 2.6849210262298584, "learning_rate": 2.3000000000000003e-05, "loss": 0.0513, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15772588551044464, "eval_overall_accuracy": 0.9576667487078513, "eval_overall_f1": 0.817824377457405, "eval_overall_precision": 0.7572815533980582, "eval_overall_recall": 0.8888888888888888, "eval_runtime": 0.3319, "eval_samples_per_second": 563.4, "eval_steps_per_second": 9.039, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.8173909783363342, "learning_rate": 2.25e-05, "loss": 0.0506, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8235294117647058, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7428571428571429, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6933333333333334, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15098540484905243, "eval_overall_accuracy": 0.9603741078021166, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7752525252525253, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3334, "eval_samples_per_second": 560.961, "eval_steps_per_second": 8.999, "step": 5830 }, { "epoch": 56.0, "grad_norm": 1.8647905588150024, "learning_rate": 2.2000000000000003e-05, "loss": 0.0511, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7517730496453899, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6973684210526315, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14845135807991028, "eval_overall_accuracy": 0.9606202313561408, "eval_overall_f1": 0.8255659121171771, "eval_overall_precision": 0.775, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3279, "eval_samples_per_second": 570.365, "eval_steps_per_second": 9.15, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.22929580509662628, "learning_rate": 2.15e-05, "loss": 0.0494, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8181818181818182, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7777777777777778, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7285714285714285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14559510350227356, "eval_overall_accuracy": 0.9618508491262614, "eval_overall_f1": 0.8230563002680965, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3268, "eval_samples_per_second": 572.194, "eval_steps_per_second": 9.18, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.6386439800262451, "learning_rate": 2.1e-05, "loss": 0.0494, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8101265822784809, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7391304347826088, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6986301369863014, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15255826711654663, "eval_overall_accuracy": 0.9603741078021166, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3324, "eval_samples_per_second": 562.613, "eval_steps_per_second": 9.026, "step": 6148 }, { "epoch": 59.0, "grad_norm": 19.432247161865234, "learning_rate": 2.05e-05, "loss": 0.0478, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1611391305923462, "eval_overall_accuracy": 0.9586512429239479, "eval_overall_f1": 0.8190224570673711, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3315, "eval_samples_per_second": 564.041, "eval_steps_per_second": 9.049, "step": 6254 }, { "epoch": 60.0, "grad_norm": 2.1011621952056885, "learning_rate": 2e-05, "loss": 0.0471, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8311688311688312, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7901234567901234, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7092198581560285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14900296926498413, "eval_overall_accuracy": 0.9613586020182131, "eval_overall_f1": 0.8214765100671142, "eval_overall_precision": 0.7766497461928934, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3328, "eval_samples_per_second": 561.901, "eval_steps_per_second": 9.014, "step": 6360 }, { "epoch": 61.0, "grad_norm": 1.5730093717575073, "learning_rate": 1.9500000000000003e-05, "loss": 0.0457, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8366013071895425, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7301587301587301, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6764705882352942, "eval_QUANTITY_recall": 0.7931034482758621, "eval_TIME_f1": 0.8285714285714286, "eval_TIME_number": 34, "eval_TIME_precision": 0.8055555555555556, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14521339535713196, "eval_overall_accuracy": 0.9623430962343096, "eval_overall_f1": 0.82907133243607, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3329, "eval_samples_per_second": 561.784, "eval_steps_per_second": 9.013, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.7596818208694458, "learning_rate": 1.9e-05, "loss": 0.0453, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7234042553191491, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1535465270280838, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3263, "eval_samples_per_second": 573.007, "eval_steps_per_second": 9.193, "step": 6572 }, { "epoch": 63.0, "grad_norm": 3.6123743057250977, "learning_rate": 1.85e-05, "loss": 0.0439, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15502122044563293, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8218085106382977, "eval_overall_precision": 0.770573566084788, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3317, "eval_samples_per_second": 563.702, "eval_steps_per_second": 9.043, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.6118897199630737, "learning_rate": 1.8e-05, "loss": 0.0467, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8289473684210525, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.6814814814814816, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6571428571428571, "eval_ORGANIZATION_recall": 0.7076923076923077, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7419354838709677, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.696969696969697, "eval_QUANTITY_recall": 0.7931034482758621, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.14392048120498657, "eval_overall_accuracy": 0.9613586020182131, "eval_overall_f1": 0.8169398907103825, "eval_overall_precision": 0.7847769028871391, "eval_overall_recall": 0.8518518518518519, "eval_runtime": 0.3318, "eval_samples_per_second": 563.555, "eval_steps_per_second": 9.041, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.4808624982833862, "learning_rate": 1.75e-05, "loss": 0.0422, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6956521739130435, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.160318523645401, "eval_overall_accuracy": 0.9591434900319961, "eval_overall_f1": 0.8185430463576159, "eval_overall_precision": 0.7648514851485149, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.332, "eval_samples_per_second": 563.291, "eval_steps_per_second": 9.037, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.028084397315979, "learning_rate": 1.7000000000000003e-05, "loss": 0.0423, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6835443037974683, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1588248461484909, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.824468085106383, "eval_overall_precision": 0.773067331670823, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3263, "eval_samples_per_second": 573.167, "eval_steps_per_second": 9.195, "step": 6996 }, { "epoch": 67.0, "grad_norm": 1.2602914571762085, "learning_rate": 1.65e-05, "loss": 0.0422, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.8441558441558442, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.8024691358024691, "eval_LOCATION_recall": 0.8904109589041096, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15185856819152832, "eval_overall_accuracy": 0.9623430962343096, "eval_overall_f1": 0.8282290279627165, "eval_overall_precision": 0.7775, "eval_overall_recall": 0.886039886039886, "eval_runtime": 0.3269, "eval_samples_per_second": 572.038, "eval_steps_per_second": 9.177, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.7608669996261597, "learning_rate": 1.6000000000000003e-05, "loss": 0.0416, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15464389324188232, "eval_overall_accuracy": 0.9616047255722373, "eval_overall_f1": 0.824468085106383, "eval_overall_precision": 0.773067331670823, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.332, "eval_samples_per_second": 563.246, "eval_steps_per_second": 9.036, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.0217771530151367, "learning_rate": 1.55e-05, "loss": 0.0403, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8235294117647058, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7875, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1511322259902954, "eval_overall_accuracy": 0.9618508491262614, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3329, "eval_samples_per_second": 561.81, "eval_steps_per_second": 9.013, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.7045354843139648, "learning_rate": 1.5e-05, "loss": 0.0411, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15936115384101868, "eval_overall_accuracy": 0.9598818606940684, "eval_overall_f1": 0.8222811671087533, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3338, "eval_samples_per_second": 560.176, "eval_steps_per_second": 8.987, "step": 7420 }, { "epoch": 71.0, "grad_norm": 1.8637417554855347, "learning_rate": 1.45e-05, "loss": 0.0391, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7225806451612903, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6222222222222222, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.17168858647346497, "eval_overall_accuracy": 0.9561900073837066, "eval_overall_f1": 0.8156862745098039, "eval_overall_precision": 0.7536231884057971, "eval_overall_recall": 0.8888888888888888, "eval_runtime": 0.332, "eval_samples_per_second": 563.182, "eval_steps_per_second": 9.035, "step": 7526 }, { "epoch": 72.0, "grad_norm": 1.0552111864089966, "learning_rate": 1.4000000000000001e-05, "loss": 0.0393, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8101265822784809, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7397260273972603, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16536851227283478, "eval_overall_accuracy": 0.9584051193699237, "eval_overall_f1": 0.8190224570673711, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3264, "eval_samples_per_second": 572.834, "eval_steps_per_second": 9.19, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.6572228670120239, "learning_rate": 1.3500000000000001e-05, "loss": 0.0411, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15696407854557037, "eval_overall_accuracy": 0.9608663549101649, "eval_overall_f1": 0.822429906542056, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3332, "eval_samples_per_second": 561.214, "eval_steps_per_second": 9.003, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.9044064283370972, "learning_rate": 1.3000000000000001e-05, "loss": 0.0408, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1582627296447754, "eval_overall_accuracy": 0.9613586020182131, "eval_overall_f1": 0.824, "eval_overall_precision": 0.7744360902255639, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3319, "eval_samples_per_second": 563.385, "eval_steps_per_second": 9.038, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.5799534916877747, "learning_rate": 1.25e-05, "loss": 0.0389, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7310344827586207, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16305667161941528, "eval_overall_accuracy": 0.9591434900319961, "eval_overall_f1": 0.8180610889774236, "eval_overall_precision": 0.7661691542288557, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3349, "eval_samples_per_second": 558.344, "eval_steps_per_second": 8.957, "step": 7950 }, { "epoch": 76.0, "grad_norm": 1.983021855354309, "learning_rate": 1.2e-05, "loss": 0.0377, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.15857818722724915, "eval_overall_accuracy": 0.9613586020182131, "eval_overall_f1": 0.8207171314741036, "eval_overall_precision": 0.7686567164179104, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3261, "eval_samples_per_second": 573.446, "eval_steps_per_second": 9.2, "step": 8056 }, { "epoch": 77.0, "grad_norm": 1.1891909837722778, "learning_rate": 1.1500000000000002e-05, "loss": 0.0404, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16166049242019653, "eval_overall_accuracy": 0.9601279842480925, "eval_overall_f1": 0.8207171314741036, "eval_overall_precision": 0.7686567164179104, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3315, "eval_samples_per_second": 564.102, "eval_steps_per_second": 9.05, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.46722444891929626, "learning_rate": 1.1000000000000001e-05, "loss": 0.0388, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7310344827586207, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8169014084507041, "eval_TIME_number": 34, "eval_TIME_precision": 0.7837837837837838, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16035309433937073, "eval_overall_accuracy": 0.9618508491262614, "eval_overall_f1": 0.823529411764706, "eval_overall_precision": 0.7758186397984886, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3324, "eval_samples_per_second": 562.645, "eval_steps_per_second": 9.026, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.8686147332191467, "learning_rate": 1.05e-05, "loss": 0.0383, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7183098591549296, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6623376623376623, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7384615384615385, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16000543534755707, "eval_overall_accuracy": 0.961112478464189, "eval_overall_f1": 0.8192771084337349, "eval_overall_precision": 0.7727272727272727, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3327, "eval_samples_per_second": 561.998, "eval_steps_per_second": 9.016, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.674788773059845, "learning_rate": 1e-05, "loss": 0.0382, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.696969696969697, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6216216216216216, "eval_QUANTITY_recall": 0.7931034482758621, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16522908210754395, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8169761273209548, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3342, "eval_samples_per_second": 559.61, "eval_steps_per_second": 8.978, "step": 8480 }, { "epoch": 81.0, "grad_norm": 1.6788341999053955, "learning_rate": 9.5e-06, "loss": 0.0378, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8101265822784809, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7297297297297298, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.17060095071792603, "eval_overall_accuracy": 0.9591434900319961, "eval_overall_f1": 0.8153034300791556, "eval_overall_precision": 0.7592137592137592, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3359, "eval_samples_per_second": 556.794, "eval_steps_per_second": 8.933, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.7395833730697632, "learning_rate": 9e-06, "loss": 0.039, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8101265822784809, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7529411764705882, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7448275862068966, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.675, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16823621094226837, "eval_overall_accuracy": 0.9598818606940684, "eval_overall_f1": 0.8196286472148541, "eval_overall_precision": 0.7667493796526055, "eval_overall_recall": 0.8803418803418803, "eval_runtime": 0.3356, "eval_samples_per_second": 557.222, "eval_steps_per_second": 8.939, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.7045236229896545, "learning_rate": 8.500000000000002e-06, "loss": 0.0372, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.6944444444444444, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16675511002540588, "eval_overall_accuracy": 0.958897366477972, "eval_overall_f1": 0.8095872170439414, "eval_overall_precision": 0.76, "eval_overall_recall": 0.8660968660968661, "eval_runtime": 0.3326, "eval_samples_per_second": 562.306, "eval_steps_per_second": 9.021, "step": 8798 }, { "epoch": 84.0, "grad_norm": 2.7517426013946533, "learning_rate": 8.000000000000001e-06, "loss": 0.0368, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1667993813753128, "eval_overall_accuracy": 0.9598818606940684, "eval_overall_f1": 0.8211920529801325, "eval_overall_precision": 0.7673267326732673, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3328, "eval_samples_per_second": 561.958, "eval_steps_per_second": 9.015, "step": 8904 }, { "epoch": 85.0, "grad_norm": 2.215299606323242, "learning_rate": 7.5e-06, "loss": 0.0374, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7194244604316546, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6756756756756757, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16433657705783844, "eval_overall_accuracy": 0.9606202313561408, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7721518987341772, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.3273, "eval_samples_per_second": 571.286, "eval_steps_per_second": 9.165, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.40606042742729187, "learning_rate": 7.000000000000001e-06, "loss": 0.0369, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7083333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6455696202531646, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6410256410256411, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1689991056919098, "eval_overall_accuracy": 0.9584051193699237, "eval_overall_f1": 0.8154050464807436, "eval_overall_precision": 0.763681592039801, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3328, "eval_samples_per_second": 561.979, "eval_steps_per_second": 9.016, "step": 9116 }, { "epoch": 87.0, "grad_norm": 1.3081475496292114, "learning_rate": 6.5000000000000004e-06, "loss": 0.036, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7132867132867133, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16559894382953644, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7688442211055276, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3315, "eval_samples_per_second": 564.057, "eval_steps_per_second": 9.049, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.7401718497276306, "learning_rate": 6e-06, "loss": 0.037, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7132867132867133, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6486486486486487, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16509054601192474, "eval_overall_accuracy": 0.9603741078021166, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7688442211055276, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3322, "eval_samples_per_second": 562.977, "eval_steps_per_second": 9.032, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.570732057094574, "learning_rate": 5.500000000000001e-06, "loss": 0.0373, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7172413793103448, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16918015480041504, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8164893617021275, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3273, "eval_samples_per_second": 571.287, "eval_steps_per_second": 9.165, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.0674538612365723, "learning_rate": 5e-06, "loss": 0.0357, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8258064516129032, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7804878048780488, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7092198581560285, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16437728703022003, "eval_overall_accuracy": 0.9603741078021166, "eval_overall_f1": 0.8155080213903743, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.327, "eval_samples_per_second": 571.778, "eval_steps_per_second": 9.173, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.779975414276123, "learning_rate": 4.5e-06, "loss": 0.0365, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1706375926733017, "eval_overall_accuracy": 0.9596357371400444, "eval_overall_f1": 0.8211920529801325, "eval_overall_precision": 0.7673267326732673, "eval_overall_recall": 0.8831908831908832, "eval_runtime": 0.3328, "eval_samples_per_second": 561.858, "eval_steps_per_second": 9.014, "step": 9646 }, { "epoch": 92.0, "grad_norm": 1.6607707738876343, "learning_rate": 4.000000000000001e-06, "loss": 0.0358, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16552191972732544, "eval_overall_accuracy": 0.9606202313561408, "eval_overall_f1": 0.8158940397350993, "eval_overall_precision": 0.7623762376237624, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3345, "eval_samples_per_second": 559.095, "eval_steps_per_second": 8.969, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.364473819732666, "learning_rate": 3.5000000000000004e-06, "loss": 0.0367, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16641728579998016, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8164893617021275, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8746438746438746, "eval_runtime": 0.3264, "eval_samples_per_second": 572.903, "eval_steps_per_second": 9.191, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.1335537433624268, "learning_rate": 3e-06, "loss": 0.0367, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7123287671232877, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6419753086419753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16745708882808685, "eval_overall_accuracy": 0.958897366477972, "eval_overall_f1": 0.8116710875331565, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3331, "eval_samples_per_second": 561.459, "eval_steps_per_second": 9.007, "step": 9964 }, { "epoch": 95.0, "grad_norm": 2.660787582397461, "learning_rate": 2.5e-06, "loss": 0.0358, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8076923076923077, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.863013698630137, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7058823529411765, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6153846153846154, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.17253383994102478, "eval_overall_accuracy": 0.9591434900319961, "eval_overall_f1": 0.8148148148148149, "eval_overall_precision": 0.7604938271604939, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3324, "eval_samples_per_second": 562.55, "eval_steps_per_second": 9.025, "step": 10070 }, { "epoch": 96.0, "grad_norm": 1.2606465816497803, "learning_rate": 2.0000000000000003e-06, "loss": 0.0374, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7123287671232877, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6419753086419753, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.746268656716418, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.8620689655172413, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1706884801387787, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8158940397350993, "eval_overall_precision": 0.7623762376237624, "eval_overall_recall": 0.8774928774928775, "eval_runtime": 0.3336, "eval_samples_per_second": 560.539, "eval_steps_per_second": 8.993, "step": 10176 }, { "epoch": 97.0, "grad_norm": 2.224013090133667, "learning_rate": 1.5e-06, "loss": 0.0342, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7132867132867133, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16819004714488983, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8149134487350199, "eval_overall_precision": 0.765, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.3327, "eval_samples_per_second": 562.071, "eval_steps_per_second": 9.017, "step": 10282 }, { "epoch": 98.0, "grad_norm": 1.7407749891281128, "learning_rate": 1.0000000000000002e-06, "loss": 0.0351, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8205128205128205, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7710843373493976, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.7234042553191491, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16785794496536255, "eval_overall_accuracy": 0.9593896135860202, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7688442211055276, "eval_overall_recall": 0.8717948717948718, "eval_runtime": 0.333, "eval_samples_per_second": 561.612, "eval_steps_per_second": 9.01, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.9356883764266968, "learning_rate": 5.000000000000001e-07, "loss": 0.036, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.6993006993006994, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6410256410256411, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.1689637303352356, "eval_overall_accuracy": 0.9586512429239479, "eval_overall_f1": 0.8111702127659575, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.3253, "eval_samples_per_second": 574.83, "eval_steps_per_second": 9.222, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.6478390693664551, "learning_rate": 0.0, "loss": 0.0368, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8152866242038217, "eval_LOCATION_number": 73, "eval_LOCATION_precision": 0.7619047619047619, "eval_LOCATION_recall": 0.8767123287671232, "eval_ORGANIZATION_f1": 0.6993006993006994, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6410256410256411, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.716417910447761, "eval_QUANTITY_number": 29, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.8275862068965517, "eval_TIME_f1": 0.8055555555555555, "eval_TIME_number": 34, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.8529411764705882, "eval_loss": 0.16865810751914978, "eval_overall_accuracy": 0.9586512429239479, "eval_overall_f1": 0.8111702127659575, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8689458689458689, "eval_runtime": 0.3331, "eval_samples_per_second": 561.343, "eval_steps_per_second": 9.006, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 4567780799240064.0, "train_loss": 0.08414012978661735, "train_runtime": 604.7606, "train_samples_per_second": 279.119, "train_steps_per_second": 17.528 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4567780799240064.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }