{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.0541012287139893, "learning_rate": 4.9500000000000004e-05, "loss": 0.9752, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.08743169398907104, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.26666666666666666, "eval_PERSON_recall": 0.05228758169934641, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 31, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.578914225101471, "eval_overall_accuracy": 0.8397324746098588, "eval_overall_f1": 0.041237113402061855, "eval_overall_precision": 0.19047619047619047, "eval_overall_recall": 0.023121387283236993, "eval_runtime": 0.3729, "eval_samples_per_second": 501.424, "eval_steps_per_second": 8.044, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.4303056001663208, "learning_rate": 4.9e-05, "loss": 0.4971, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.36363636363636365, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6, "eval_LOCATION_recall": 0.2608695652173913, "eval_ORGANIZATION_f1": 0.04597701149425287, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.07692307692307693, "eval_ORGANIZATION_recall": 0.03278688524590164, "eval_PERSON_f1": 0.6265060240963856, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.4961832061068702, "eval_PERSON_recall": 0.8496732026143791, "eval_QUANTITY_f1": 0.04081632653061224, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.058823529411764705, "eval_QUANTITY_recall": 0.03125, "eval_TIME_f1": 0.5, "eval_TIME_number": 31, "eval_TIME_precision": 0.4222222222222222, "eval_TIME_recall": 0.6129032258064516, "eval_loss": 0.34586551785469055, "eval_overall_accuracy": 0.8981917265296012, "eval_overall_f1": 0.4683195592286501, "eval_overall_precision": 0.4473684210526316, "eval_overall_recall": 0.4913294797687861, "eval_runtime": 0.3784, "eval_samples_per_second": 494.164, "eval_steps_per_second": 7.928, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.2177335023880005, "learning_rate": 4.85e-05, "loss": 0.3054, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.585635359116022, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.4732142857142857, "eval_LOCATION_recall": 0.7681159420289855, "eval_ORGANIZATION_f1": 0.4705882352941177, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.4266666666666667, "eval_ORGANIZATION_recall": 0.5245901639344263, "eval_PERSON_f1": 0.8168168168168167, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.7555555555555555, "eval_PERSON_recall": 0.8888888888888888, "eval_QUANTITY_f1": 0.5789473684210527, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5, "eval_QUANTITY_recall": 0.6875, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.21867817640304565, "eval_overall_accuracy": 0.9326232350755511, "eval_overall_f1": 0.6834804539722573, "eval_overall_precision": 0.6062639821029083, "eval_overall_recall": 0.7832369942196532, "eval_runtime": 0.3785, "eval_samples_per_second": 494.043, "eval_steps_per_second": 7.926, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.0648493766784668, "learning_rate": 4.8e-05, "loss": 0.2131, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6951219512195121, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.5774647887323944, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5061728395061729, "eval_ORGANIZATION_recall": 0.6721311475409836, "eval_PERSON_f1": 0.8685015290519879, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8160919540229885, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.5853658536585366, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.48, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.6753246753246753, "eval_TIME_number": 31, "eval_TIME_precision": 0.5652173913043478, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.18452519178390503, "eval_overall_accuracy": 0.939311369829081, "eval_overall_f1": 0.7323232323232323, "eval_overall_precision": 0.6502242152466368, "eval_overall_recall": 0.838150289017341, "eval_runtime": 0.3868, "eval_samples_per_second": 483.448, "eval_steps_per_second": 7.756, "step": 424 }, { "epoch": 5.0, "grad_norm": 0.82362300157547, "learning_rate": 4.75e-05, "loss": 0.1765, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.728476821192053, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6707317073170732, "eval_LOCATION_recall": 0.7971014492753623, "eval_ORGANIZATION_f1": 0.6620689655172414, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5714285714285714, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.8827160493827161, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8362573099415205, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.1476963609457016, "eval_overall_accuracy": 0.9544216001981669, "eval_overall_f1": 0.796812749003984, "eval_overall_precision": 0.7371007371007371, "eval_overall_recall": 0.8670520231213873, "eval_runtime": 0.3778, "eval_samples_per_second": 494.985, "eval_steps_per_second": 7.941, "step": 530 }, { "epoch": 6.0, "grad_norm": 0.464044988155365, "learning_rate": 4.7e-05, "loss": 0.1544, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.6874999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6043956043956044, "eval_LOCATION_recall": 0.7971014492753623, "eval_ORGANIZATION_f1": 0.6533333333333333, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.550561797752809, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8881987577639752, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8461538461538461, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.6578947368421052, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5681818181818182, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.75, "eval_TIME_number": 31, "eval_TIME_precision": 0.6585365853658537, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15219637751579285, "eval_overall_accuracy": 0.9477334654446371, "eval_overall_f1": 0.7666666666666667, "eval_overall_precision": 0.6889400921658986, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.3744, "eval_samples_per_second": 499.529, "eval_steps_per_second": 8.014, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.4864940345287323, "learning_rate": 4.6500000000000005e-05, "loss": 0.1461, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6928104575163399, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5760869565217391, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8881987577639752, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8461538461538461, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7297297297297298, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.14314229786396027, "eval_overall_accuracy": 0.9554124349764677, "eval_overall_f1": 0.8077922077922078, "eval_overall_precision": 0.7334905660377359, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3767, "eval_samples_per_second": 496.387, "eval_steps_per_second": 7.963, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.7082120180130005, "learning_rate": 4.600000000000001e-05, "loss": 0.1374, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7037037037037037, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7123287671232876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.611764705882353, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8792569659442725, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8352941176470589, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7397260273972603, "eval_TIME_number": 31, "eval_TIME_precision": 0.6428571428571429, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1362513303756714, "eval_overall_accuracy": 0.9549170175873173, "eval_overall_f1": 0.7968545216251639, "eval_overall_precision": 0.7290167865707434, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3742, "eval_samples_per_second": 499.783, "eval_steps_per_second": 8.018, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.059523582458496, "learning_rate": 4.55e-05, "loss": 0.1256, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.728395061728395, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6344086021505376, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6511627906976745, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6176470588235294, "eval_ORGANIZATION_recall": 0.6885245901639344, "eval_PERSON_f1": 0.8847352024922119, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8452380952380952, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7671232876712328, "eval_TIME_number": 31, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.13946935534477234, "eval_overall_accuracy": 0.9536784741144414, "eval_overall_f1": 0.7894039735099337, "eval_overall_precision": 0.7286063569682152, "eval_overall_recall": 0.861271676300578, "eval_runtime": 0.3747, "eval_samples_per_second": 499.083, "eval_steps_per_second": 8.007, "step": 954 }, { "epoch": 10.0, "grad_norm": 0.9830942153930664, "learning_rate": 4.5e-05, "loss": 0.1227, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.896551724137931, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8614457831325302, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12411845475435257, "eval_overall_accuracy": 0.9583849393113698, "eval_overall_f1": 0.8134228187919462, "eval_overall_precision": 0.7593984962406015, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.377, "eval_samples_per_second": 495.985, "eval_steps_per_second": 7.957, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.3884367048740387, "learning_rate": 4.4500000000000004e-05, "loss": 0.1154, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6744186046511628, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.6769230769230768, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6376811594202898, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.9022082018927446, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8719512195121951, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.6923076923076924, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12845103442668915, "eval_overall_accuracy": 0.9546693088927422, "eval_overall_f1": 0.7994652406417112, "eval_overall_precision": 0.7437810945273632, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.3748, "eval_samples_per_second": 498.943, "eval_steps_per_second": 8.004, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.482397198677063, "learning_rate": 4.4000000000000006e-05, "loss": 0.1102, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6616541353383459, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.9148264984227129, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8841463414634146, "eval_PERSON_recall": 0.9477124183006536, "eval_QUANTITY_f1": 0.7012987012987012, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12422426789999008, "eval_overall_accuracy": 0.9581372306167947, "eval_overall_f1": 0.8200270635994588, "eval_overall_precision": 0.7709923664122137, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3755, "eval_samples_per_second": 498.012, "eval_steps_per_second": 7.989, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.5229460000991821, "learning_rate": 4.35e-05, "loss": 0.1045, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7549668874172186, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6951219512195121, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9028213166144202, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8674698795180723, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.823529411764706, "eval_TIME_number": 31, "eval_TIME_precision": 0.7567567567567568, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.12873566150665283, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8137384412153236, "eval_overall_precision": 0.7493917274939172, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3736, "eval_samples_per_second": 500.496, "eval_steps_per_second": 8.029, "step": 1378 }, { "epoch": 14.0, "grad_norm": 0.913377583026886, "learning_rate": 4.3e-05, "loss": 0.103, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6901408450704226, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6049382716049383, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8622754491017964, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7105263157894737, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13010737299919128, "eval_overall_accuracy": 0.9583849393113698, "eval_overall_f1": 0.8158940397350993, "eval_overall_precision": 0.7530562347188264, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3724, "eval_samples_per_second": 502.128, "eval_steps_per_second": 8.056, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.28188779950141907, "learning_rate": 4.25e-05, "loss": 0.1017, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7631578947368421, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.6564885496183206, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6142857142857143, "eval_ORGANIZATION_recall": 0.7049180327868853, "eval_PERSON_f1": 0.9177215189873417, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8895705521472392, "eval_PERSON_recall": 0.9477124183006536, "eval_QUANTITY_f1": 0.7297297297297298, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12356830388307571, "eval_overall_accuracy": 0.9598711914788209, "eval_overall_f1": 0.8196721311475409, "eval_overall_precision": 0.7772020725388601, "eval_overall_recall": 0.8670520231213873, "eval_runtime": 0.375, "eval_samples_per_second": 498.728, "eval_steps_per_second": 8.001, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.5976079702377319, "learning_rate": 4.2e-05, "loss": 0.0944, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7123287671232876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.611764705882353, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.909657320872274, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8690476190476191, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.12926575541496277, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8331108144192255, "eval_overall_precision": 0.7741935483870968, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3791, "eval_samples_per_second": 493.213, "eval_steps_per_second": 7.913, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.3376772701740265, "learning_rate": 4.15e-05, "loss": 0.0911, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7468354430379747, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6629213483146067, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.874251497005988, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.13467147946357727, "eval_overall_accuracy": 0.9598711914788209, "eval_overall_f1": 0.8168642951251647, "eval_overall_precision": 0.7506053268765133, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.377, "eval_samples_per_second": 495.972, "eval_steps_per_second": 7.957, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.5633219480514526, "learning_rate": 4.1e-05, "loss": 0.0862, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7891156462585034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.676056338028169, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9182389937106918, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8848484848484849, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7397260273972602, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12517449259757996, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8326530612244898, "eval_overall_precision": 0.7866323907455013, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3742, "eval_samples_per_second": 499.67, "eval_steps_per_second": 8.016, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.9083814024925232, "learning_rate": 4.05e-05, "loss": 0.0861, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.7777777777777779, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7466666666666667, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.6818181818181818, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6338028169014085, "eval_ORGANIZATION_recall": 0.7377049180327869, "eval_PERSON_f1": 0.9085173501577287, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8780487804878049, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.12289129197597504, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.823045267489712, "eval_overall_precision": 0.783289817232376, "eval_overall_recall": 0.8670520231213873, "eval_runtime": 0.3754, "eval_samples_per_second": 498.106, "eval_steps_per_second": 7.991, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.42938560247421265, "learning_rate": 4e-05, "loss": 0.0834, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7123287671232876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.611764705882353, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.72, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13770651817321777, "eval_overall_accuracy": 0.9566509784493435, "eval_overall_f1": 0.8211920529801324, "eval_overall_precision": 0.7579462102689487, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3749, "eval_samples_per_second": 498.842, "eval_steps_per_second": 8.003, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.4163472056388855, "learning_rate": 3.9500000000000005e-05, "loss": 0.0812, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7019867549668874, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5888888888888889, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9130434782608696, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8698224852071006, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.6933333333333334, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6046511627906976, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15470075607299805, "eval_overall_accuracy": 0.9529353480307159, "eval_overall_f1": 0.8156862745098038, "eval_overall_precision": 0.7446300715990454, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.374, "eval_samples_per_second": 500.009, "eval_steps_per_second": 8.022, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.5683150887489319, "learning_rate": 3.9000000000000006e-05, "loss": 0.0775, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7222222222222222, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6265060240963856, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9158878504672897, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7397260273972602, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.134428471326828, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8243064729194187, "eval_overall_precision": 0.7591240875912408, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3741, "eval_samples_per_second": 499.827, "eval_steps_per_second": 8.019, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.34687337279319763, "learning_rate": 3.85e-05, "loss": 0.0749, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8028169014084506, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7808219178082192, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6419753086419753, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12430478632450104, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8443843031123139, "eval_overall_precision": 0.7938931297709924, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3735, "eval_samples_per_second": 500.696, "eval_steps_per_second": 8.033, "step": 2438 }, { "epoch": 24.0, "grad_norm": 4.703299045562744, "learning_rate": 3.8e-05, "loss": 0.0741, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6950354609929078, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6125, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.915360501567398, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8795180722891566, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13924448192119598, "eval_overall_accuracy": 0.9596234827842457, "eval_overall_f1": 0.8284182305630027, "eval_overall_precision": 0.7725, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.376, "eval_samples_per_second": 497.288, "eval_steps_per_second": 7.978, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.5041608214378357, "learning_rate": 3.7500000000000003e-05, "loss": 0.0723, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.75177304964539, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9158878504672897, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.14030230045318604, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8368983957219251, "eval_overall_precision": 0.7786069651741293, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3717, "eval_samples_per_second": 503.108, "eval_steps_per_second": 8.071, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.0920377969741821, "learning_rate": 3.7e-05, "loss": 0.0711, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.786206896551724, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7310344827586208, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.896969696969697, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14644105732440948, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8337801608579088, "eval_overall_precision": 0.7775, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.375, "eval_samples_per_second": 498.657, "eval_steps_per_second": 8.0, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.1851744651794434, "learning_rate": 3.65e-05, "loss": 0.0675, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.915360501567398, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8795180722891566, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13256658613681793, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8342245989304814, "eval_overall_precision": 0.7761194029850746, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3754, "eval_samples_per_second": 498.103, "eval_steps_per_second": 7.991, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.8179621696472168, "learning_rate": 3.6e-05, "loss": 0.0656, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7313432835820896, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13896366953849792, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.842391304347826, "eval_overall_precision": 0.7948717948717948, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3798, "eval_samples_per_second": 492.362, "eval_steps_per_second": 7.899, "step": 2968 }, { "epoch": 29.0, "grad_norm": 1.071942925453186, "learning_rate": 3.55e-05, "loss": 0.0666, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6341463414634146, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1382647156715393, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8324468085106382, "eval_overall_precision": 0.770935960591133, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3732, "eval_samples_per_second": 501.13, "eval_steps_per_second": 8.04, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.5458754897117615, "learning_rate": 3.5e-05, "loss": 0.065, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9333333333333333, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9074074074074074, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1359969526529312, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.839142091152815, "eval_overall_precision": 0.7825, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3753, "eval_samples_per_second": 498.297, "eval_steps_per_second": 7.994, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.8183054327964783, "learning_rate": 3.45e-05, "loss": 0.0641, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13141290843486786, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.840108401084011, "eval_overall_precision": 0.7908163265306123, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3761, "eval_samples_per_second": 497.223, "eval_steps_per_second": 7.977, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.7471626400947571, "learning_rate": 3.4000000000000007e-05, "loss": 0.0625, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7153284671532848, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13418298959732056, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.8344549125168238, "eval_overall_precision": 0.7808564231738035, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3778, "eval_samples_per_second": 495.024, "eval_steps_per_second": 7.942, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.30342888832092285, "learning_rate": 3.35e-05, "loss": 0.0619, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6906474820143885, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9245283018867925, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8909090909090909, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7397260273972602, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7536231884057972, "eval_TIME_number": 31, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.141060933470726, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.822429906542056, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3745, "eval_samples_per_second": 499.347, "eval_steps_per_second": 8.011, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.6614820957183838, "learning_rate": 3.3e-05, "loss": 0.0602, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.689655172413793, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5952380952380952, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7123287671232876, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7536231884057972, "eval_TIME_number": 31, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1591266542673111, "eval_overall_accuracy": 0.9556601436710429, "eval_overall_f1": 0.8221343873517786, "eval_overall_precision": 0.7554479418886199, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.374, "eval_samples_per_second": 500.045, "eval_steps_per_second": 8.022, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.9236454963684082, "learning_rate": 3.2500000000000004e-05, "loss": 0.0582, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.620253164556962, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9249999999999999, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8862275449101796, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7761194029850746, "eval_TIME_number": 31, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14139990508556366, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8304405874499332, "eval_overall_precision": 0.771712158808933, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3774, "eval_samples_per_second": 495.502, "eval_steps_per_second": 7.949, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.27499887347221375, "learning_rate": 3.2000000000000005e-05, "loss": 0.0574, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7368421052631579, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6746987951807228, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.725925925925926, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6621621621621622, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9371069182389938, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9030303030303031, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14524929225444794, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.8346883468834689, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3745, "eval_samples_per_second": 499.274, "eval_steps_per_second": 8.01, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.040267825126648, "learning_rate": 3.15e-05, "loss": 0.0551, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7549668874172186, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6951219512195121, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14648863673210144, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8263795423956932, "eval_overall_precision": 0.7732997481108312, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3762, "eval_samples_per_second": 497.137, "eval_steps_per_second": 7.975, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.9761358499526978, "learning_rate": 3.1e-05, "loss": 0.056, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7007299270072993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.631578947368421, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9303797468354431, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.901840490797546, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1346336156129837, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8385345997286295, "eval_overall_precision": 0.7902813299232737, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3754, "eval_samples_per_second": 498.071, "eval_steps_per_second": 7.99, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.7863456606864929, "learning_rate": 3.05e-05, "loss": 0.0571, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7073170731707317, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7338129496402876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13755863904953003, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.835579514824798, "eval_overall_precision": 0.7828282828282829, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3744, "eval_samples_per_second": 499.503, "eval_steps_per_second": 8.013, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.4372481107711792, "learning_rate": 3e-05, "loss": 0.0509, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.6814814814814815, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6216216216216216, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13881690800189972, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.828804347826087, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3754, "eval_samples_per_second": 498.168, "eval_steps_per_second": 7.992, "step": 4240 }, { "epoch": 41.0, "grad_norm": 1.0561209917068481, "learning_rate": 2.95e-05, "loss": 0.052, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6891891891891891, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5862068965517241, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9245283018867925, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8909090909090909, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14717642962932587, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8353413654618473, "eval_overall_precision": 0.7780548628428927, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3875, "eval_samples_per_second": 482.629, "eval_steps_per_second": 7.743, "step": 4346 }, { "epoch": 42.0, "grad_norm": 1.18325936794281, "learning_rate": 2.9e-05, "loss": 0.0526, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.7894736842105263, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7101449275362318, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1472916603088379, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8367071524966261, "eval_overall_precision": 0.7848101265822784, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3724, "eval_samples_per_second": 502.108, "eval_steps_per_second": 8.055, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.44864386320114136, "learning_rate": 2.8499999999999998e-05, "loss": 0.0503, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6616541353383459, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14042706787586212, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8367626886145405, "eval_overall_precision": 0.7963446475195822, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3766, "eval_samples_per_second": 496.505, "eval_steps_per_second": 7.965, "step": 4558 }, { "epoch": 44.0, "grad_norm": 1.731616497039795, "learning_rate": 2.8000000000000003e-05, "loss": 0.05, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1412889063358307, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8335588633288228, "eval_overall_precision": 0.7837150127226463, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.381, "eval_samples_per_second": 490.863, "eval_steps_per_second": 7.875, "step": 4664 }, { "epoch": 45.0, "grad_norm": 0.8027646541595459, "learning_rate": 2.7500000000000004e-05, "loss": 0.0488, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.676470588235294, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6133333333333333, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13843049108982086, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8431105047748976, "eval_overall_precision": 0.7984496124031008, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3744, "eval_samples_per_second": 499.493, "eval_steps_per_second": 8.013, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.44881823658943176, "learning_rate": 2.7000000000000002e-05, "loss": 0.0471, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8079470198675496, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6956521739130435, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6233766233766234, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9211356466876972, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8902439024390244, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13977740705013275, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8335588633288228, "eval_overall_precision": 0.7837150127226463, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3761, "eval_samples_per_second": 497.169, "eval_steps_per_second": 7.976, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.5853442549705505, "learning_rate": 2.6500000000000004e-05, "loss": 0.0483, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7891156462585034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7153284671532848, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14364777505397797, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8308525033829499, "eval_overall_precision": 0.7811704834605598, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3752, "eval_samples_per_second": 498.37, "eval_steps_per_second": 7.995, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.8860626220703125, "learning_rate": 2.6000000000000002e-05, "loss": 0.0451, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7101449275362318, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7761194029850746, "eval_TIME_number": 31, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.15161269903182983, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8364611260053619, "eval_overall_precision": 0.78, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3753, "eval_samples_per_second": 498.293, "eval_steps_per_second": 7.994, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.2444094717502594, "learning_rate": 2.5500000000000003e-05, "loss": 0.0471, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7352941176470588, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14613822102546692, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8451086956521738, "eval_overall_precision": 0.7974358974358975, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3786, "eval_samples_per_second": 493.953, "eval_steps_per_second": 7.924, "step": 5194 }, { "epoch": 50.0, "grad_norm": 0.8297089338302612, "learning_rate": 2.5e-05, "loss": 0.0419, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7164179104477612, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6575342465753424, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8253968253968254, "eval_TIME_number": 31, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14306952059268951, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8477366255144032, "eval_overall_precision": 0.8067885117493473, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3745, "eval_samples_per_second": 499.298, "eval_steps_per_second": 8.01, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.4903518855571747, "learning_rate": 2.45e-05, "loss": 0.0406, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7083333333333334, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6144578313253012, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15998348593711853, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8346666666666667, "eval_overall_precision": 0.7747524752475248, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3771, "eval_samples_per_second": 495.853, "eval_steps_per_second": 7.955, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.886262834072113, "learning_rate": 2.4e-05, "loss": 0.0427, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.723404255319149, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6375, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.15491357445716858, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.8378378378378379, "eval_overall_precision": 0.7868020304568528, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.377, "eval_samples_per_second": 495.985, "eval_steps_per_second": 7.957, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.1054624319076538, "learning_rate": 2.35e-05, "loss": 0.0426, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15161831676959991, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8408163265306122, "eval_overall_precision": 0.794344473007712, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3745, "eval_samples_per_second": 499.342, "eval_steps_per_second": 8.011, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.31659141182899475, "learning_rate": 2.3000000000000003e-05, "loss": 0.0401, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.7945205479452054, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7310344827586208, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.15523718297481537, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.8364611260053619, "eval_overall_precision": 0.78, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3741, "eval_samples_per_second": 499.826, "eval_steps_per_second": 8.019, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.8402573466300964, "learning_rate": 2.25e-05, "loss": 0.0399, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14873124659061432, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.828146143437077, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3761, "eval_samples_per_second": 497.222, "eval_steps_per_second": 7.977, "step": 5830 }, { "epoch": 56.0, "grad_norm": 2.248713254928589, "learning_rate": 2.2000000000000003e-05, "loss": 0.0402, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6956521739130435, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6233766233766234, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9371069182389938, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9030303030303031, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15828868746757507, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8328840970350404, "eval_overall_precision": 0.7803030303030303, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.376, "eval_samples_per_second": 497.316, "eval_steps_per_second": 7.978, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.34086835384368896, "learning_rate": 2.15e-05, "loss": 0.0406, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7164179104477612, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6575342465753424, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15400414168834686, "eval_overall_accuracy": 0.9653207827594749, "eval_overall_f1": 0.8469945355191256, "eval_overall_precision": 0.8031088082901554, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3749, "eval_samples_per_second": 498.776, "eval_steps_per_second": 8.002, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.3621896505355835, "learning_rate": 2.1e-05, "loss": 0.0402, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1636234074831009, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8364611260053619, "eval_overall_precision": 0.78, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3779, "eval_samples_per_second": 494.823, "eval_steps_per_second": 7.938, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.6952288746833801, "learning_rate": 2.05e-05, "loss": 0.0387, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1611531525850296, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8364611260053619, "eval_overall_precision": 0.78, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3758, "eval_samples_per_second": 497.564, "eval_steps_per_second": 7.982, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.3612290322780609, "learning_rate": 2e-05, "loss": 0.0402, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.6808510638297871, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8, "eval_TIME_number": 31, "eval_TIME_precision": 0.717948717948718, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.16257652640342712, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8235294117647058, "eval_overall_precision": 0.7661691542288557, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3768, "eval_samples_per_second": 496.251, "eval_steps_per_second": 7.961, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.3965584337711334, "learning_rate": 1.9500000000000003e-05, "loss": 0.0382, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7050359712230215, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6282051282051282, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8115942028985507, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7567567567567568, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15209117531776428, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8439620081411127, "eval_overall_precision": 0.7953964194373402, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3753, "eval_samples_per_second": 498.223, "eval_steps_per_second": 7.993, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.3826664984226227, "learning_rate": 1.9e-05, "loss": 0.038, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7246376811594203, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6493506493506493, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7999999999999999, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7368421052631579, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1556433141231537, "eval_overall_accuracy": 0.9653207827594749, "eval_overall_f1": 0.8497970230040597, "eval_overall_precision": 0.7989821882951654, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3732, "eval_samples_per_second": 501.096, "eval_steps_per_second": 8.039, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.16946372389793396, "learning_rate": 1.85e-05, "loss": 0.0391, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7299270072992702, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.15297681093215942, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8435374149659864, "eval_overall_precision": 0.7969151670951157, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3768, "eval_samples_per_second": 496.267, "eval_steps_per_second": 7.961, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.5709309577941895, "learning_rate": 1.8e-05, "loss": 0.0377, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7205882352941175, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6533333333333333, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1536598950624466, "eval_overall_accuracy": 0.9653207827594749, "eval_overall_f1": 0.8451086956521738, "eval_overall_precision": 0.7974358974358975, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3742, "eval_samples_per_second": 499.72, "eval_steps_per_second": 8.017, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.6132174134254456, "learning_rate": 1.75e-05, "loss": 0.0345, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.723404255319149, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6375, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15807974338531494, "eval_overall_accuracy": 0.9635868218974486, "eval_overall_f1": 0.8432432432432434, "eval_overall_precision": 0.7918781725888325, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3793, "eval_samples_per_second": 493.053, "eval_steps_per_second": 7.91, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.0831232070922852, "learning_rate": 1.7000000000000003e-05, "loss": 0.0367, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7194244604316549, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6410256410256411, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9463722397476341, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9146341463414634, "eval_PERSON_recall": 0.9803921568627451, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1538369357585907, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8405405405405405, "eval_overall_precision": 0.7893401015228426, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3751, "eval_samples_per_second": 498.591, "eval_steps_per_second": 7.999, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.5706846714019775, "learning_rate": 1.65e-05, "loss": 0.0338, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7338129496402876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1590246558189392, "eval_overall_accuracy": 0.9660639088432004, "eval_overall_f1": 0.8470906630581866, "eval_overall_precision": 0.7964376590330788, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3739, "eval_samples_per_second": 500.15, "eval_steps_per_second": 8.024, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.8377193808555603, "learning_rate": 1.6000000000000003e-05, "loss": 0.0346, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.821917808219178, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7153284671532848, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15623514354228973, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8474114441416893, "eval_overall_precision": 0.8015463917525774, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3737, "eval_samples_per_second": 500.375, "eval_steps_per_second": 8.027, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.5355998277664185, "learning_rate": 1.55e-05, "loss": 0.0333, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.711111111111111, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6486486486486487, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15333040058612823, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8458390177353343, "eval_overall_precision": 0.8010335917312662, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3742, "eval_samples_per_second": 499.782, "eval_steps_per_second": 8.018, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.8504950404167175, "learning_rate": 1.5e-05, "loss": 0.0339, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7194244604316549, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6410256410256411, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9490445859872612, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9254658385093167, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15827783942222595, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8451086956521738, "eval_overall_precision": 0.7974358974358975, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3754, "eval_samples_per_second": 498.15, "eval_steps_per_second": 7.992, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.0832040011882782, "learning_rate": 1.45e-05, "loss": 0.0336, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8079470198675496, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7338129496402876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6538461538461539, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16177228093147278, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8463611859838275, "eval_overall_precision": 0.7929292929292929, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3774, "eval_samples_per_second": 495.5, "eval_steps_per_second": 7.949, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.9196206331253052, "learning_rate": 1.4000000000000001e-05, "loss": 0.0321, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17121733725070953, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8262032085561497, "eval_overall_precision": 0.7686567164179104, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3765, "eval_samples_per_second": 496.728, "eval_steps_per_second": 7.969, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.9101676344871521, "learning_rate": 1.3500000000000001e-05, "loss": 0.033, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1599177122116089, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8462585034013606, "eval_overall_precision": 0.7994858611825193, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3727, "eval_samples_per_second": 501.679, "eval_steps_per_second": 8.048, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.29207730293273926, "learning_rate": 1.3000000000000001e-05, "loss": 0.032, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6911764705882353, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6266666666666667, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16745725274085999, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.8319783197831978, "eval_overall_precision": 0.7831632653061225, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3751, "eval_samples_per_second": 498.534, "eval_steps_per_second": 7.998, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.41321995854377747, "learning_rate": 1.25e-05, "loss": 0.0327, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1649351716041565, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.842391304347826, "eval_overall_precision": 0.7948717948717948, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3742, "eval_samples_per_second": 499.772, "eval_steps_per_second": 8.018, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.3396766185760498, "learning_rate": 1.2e-05, "loss": 0.0316, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6911764705882353, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6266666666666667, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16384615004062653, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8392370572207084, "eval_overall_precision": 0.7938144329896907, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3738, "eval_samples_per_second": 500.223, "eval_steps_per_second": 8.025, "step": 8056 }, { "epoch": 77.0, "grad_norm": 2.2026262283325195, "learning_rate": 1.1500000000000002e-05, "loss": 0.0311, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5974025974025974, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1676771342754364, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8297297297297296, "eval_overall_precision": 0.7791878172588832, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3753, "eval_samples_per_second": 498.284, "eval_steps_per_second": 7.994, "step": 8162 }, { "epoch": 78.0, "grad_norm": 1.9219529628753662, "learning_rate": 1.1000000000000001e-05, "loss": 0.0313, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6808510638297871, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16492274403572083, "eval_overall_accuracy": 0.9635868218974486, "eval_overall_f1": 0.8346883468834689, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3755, "eval_samples_per_second": 497.993, "eval_steps_per_second": 7.989, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.4185786545276642, "learning_rate": 1.05e-05, "loss": 0.0297, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6969696969696969, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9303797468354431, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.901840490797546, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1650223582983017, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8349249658935879, "eval_overall_precision": 0.7906976744186046, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3737, "eval_samples_per_second": 500.389, "eval_steps_per_second": 8.028, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.915241003036499, "learning_rate": 1e-05, "loss": 0.0299, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16577459871768951, "eval_overall_accuracy": 0.964082239286599, "eval_overall_f1": 0.8365122615803814, "eval_overall_precision": 0.7912371134020618, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3818, "eval_samples_per_second": 489.811, "eval_steps_per_second": 7.858, "step": 8480 }, { "epoch": 81.0, "grad_norm": 1.0720077753067017, "learning_rate": 9.5e-06, "loss": 0.029, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5974025974025974, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7647058823529411, "eval_TIME_number": 31, "eval_TIME_precision": 0.7027027027027027, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.17195791006088257, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8209959623149394, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3835, "eval_samples_per_second": 487.605, "eval_steps_per_second": 7.823, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.3890499472618103, "learning_rate": 9e-06, "loss": 0.0309, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7175572519083969, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6714285714285714, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16233526170253754, "eval_overall_accuracy": 0.9658162001486252, "eval_overall_f1": 0.8449931412894376, "eval_overall_precision": 0.804177545691906, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3819, "eval_samples_per_second": 489.687, "eval_steps_per_second": 7.856, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.3679879903793335, "learning_rate": 8.500000000000002e-06, "loss": 0.0286, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7050359712230215, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6282051282051282, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16112035512924194, "eval_overall_accuracy": 0.964082239286599, "eval_overall_f1": 0.8389715832205684, "eval_overall_precision": 0.7888040712468194, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3787, "eval_samples_per_second": 493.757, "eval_steps_per_second": 7.921, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.78831946849823, "learning_rate": 8.000000000000001e-06, "loss": 0.0286, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7246376811594203, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6493506493506493, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16939504444599152, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.8405405405405405, "eval_overall_precision": 0.7893401015228426, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3839, "eval_samples_per_second": 487.106, "eval_steps_per_second": 7.815, "step": 8904 }, { "epoch": 85.0, "grad_norm": 1.5276166200637817, "learning_rate": 7.5e-06, "loss": 0.0298, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7014925373134328, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7536231884057972, "eval_TIME_number": 31, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1691165566444397, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.830393487109905, "eval_overall_precision": 0.782608695652174, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3784, "eval_samples_per_second": 494.156, "eval_steps_per_second": 7.928, "step": 9010 }, { "epoch": 86.0, "grad_norm": 1.4778416156768799, "learning_rate": 7.000000000000001e-06, "loss": 0.0293, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.711111111111111, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6486486486486487, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1705159842967987, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8365122615803814, "eval_overall_precision": 0.7912371134020618, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3783, "eval_samples_per_second": 494.321, "eval_steps_per_second": 7.93, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.7736322283744812, "learning_rate": 6.5000000000000004e-06, "loss": 0.0281, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16937683522701263, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.835820895522388, "eval_overall_precision": 0.7877237851662404, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3782, "eval_samples_per_second": 494.406, "eval_steps_per_second": 7.932, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.9048134684562683, "learning_rate": 6e-06, "loss": 0.0294, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7246376811594203, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6493506493506493, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1706814169883728, "eval_overall_accuracy": 0.9635868218974486, "eval_overall_f1": 0.8416779431664413, "eval_overall_precision": 0.7913486005089059, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3792, "eval_samples_per_second": 493.178, "eval_steps_per_second": 7.912, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.8254857659339905, "learning_rate": 5.500000000000001e-06, "loss": 0.0279, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7101449275362318, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16873446106910706, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8385345997286295, "eval_overall_precision": 0.7902813299232737, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3786, "eval_samples_per_second": 493.963, "eval_steps_per_second": 7.925, "step": 9434 }, { "epoch": 90.0, "grad_norm": 6.16793155670166, "learning_rate": 5e-06, "loss": 0.0263, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.725925925925926, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6621621621621622, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17040900886058807, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8446866485013624, "eval_overall_precision": 0.7989690721649485, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3802, "eval_samples_per_second": 491.899, "eval_steps_per_second": 7.891, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.16071051359176636, "learning_rate": 4.5e-06, "loss": 0.0263, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7205882352941175, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6533333333333333, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16665896773338318, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8408163265306122, "eval_overall_precision": 0.794344473007712, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3786, "eval_samples_per_second": 493.888, "eval_steps_per_second": 7.923, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.42266806960105896, "learning_rate": 4.000000000000001e-06, "loss": 0.0253, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7067669172932329, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6527777777777778, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16992609202861786, "eval_overall_accuracy": 0.964082239286599, "eval_overall_f1": 0.8380952380952382, "eval_overall_precision": 0.7917737789203085, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3794, "eval_samples_per_second": 492.83, "eval_steps_per_second": 7.906, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.28303977847099304, "learning_rate": 3.5000000000000004e-06, "loss": 0.0268, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7014925373134328, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17390000820159912, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8346883468834689, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3786, "eval_samples_per_second": 493.969, "eval_steps_per_second": 7.925, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.3909311294555664, "learning_rate": 3e-06, "loss": 0.0258, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17267082631587982, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8373983739837398, "eval_overall_precision": 0.7882653061224489, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3812, "eval_samples_per_second": 490.593, "eval_steps_per_second": 7.87, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.2576075792312622, "learning_rate": 2.5e-06, "loss": 0.0266, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7761194029850746, "eval_TIME_number": 31, "eval_TIME_precision": 0.7222222222222222, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.17561542987823486, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.8308525033829499, "eval_overall_precision": 0.7811704834605598, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3798, "eval_samples_per_second": 492.339, "eval_steps_per_second": 7.898, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.6370512247085571, "learning_rate": 2.0000000000000003e-06, "loss": 0.0269, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7299270072992702, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17201797664165497, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8412483039348712, "eval_overall_precision": 0.7928388746803069, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3782, "eval_samples_per_second": 494.463, "eval_steps_per_second": 7.933, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.20887865126132965, "learning_rate": 1.5e-06, "loss": 0.0254, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7218045112781954, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17065702378749847, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8392370572207084, "eval_overall_precision": 0.7938144329896907, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.38, "eval_samples_per_second": 492.121, "eval_steps_per_second": 7.895, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.5937870144844055, "learning_rate": 1.0000000000000002e-06, "loss": 0.0259, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7313432835820896, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17093446850776672, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8431105047748976, "eval_overall_precision": 0.7984496124031008, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3859, "eval_samples_per_second": 484.64, "eval_steps_per_second": 7.775, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.9572729468345642, "learning_rate": 5.000000000000001e-07, "loss": 0.0263, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7313432835820896, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17115430533885956, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8446866485013624, "eval_overall_precision": 0.7989690721649485, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3755, "eval_samples_per_second": 498.013, "eval_steps_per_second": 7.99, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.8170201778411865, "learning_rate": 0.0, "loss": 0.0259, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7313432835820896, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6712328767123288, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17119528353214264, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8446866485013624, "eval_overall_precision": 0.7989690721649485, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3777, "eval_samples_per_second": 495.061, "eval_steps_per_second": 7.942, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5088556202474382.0, "train_loss": 0.07243871596624267, "train_runtime": 604.8321, "train_samples_per_second": 278.92, "train_steps_per_second": 17.526 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5088556202474382.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }