{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.289084553718567, "learning_rate": 4.9500000000000004e-05, "loss": 0.9293, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.012738853503184716, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.25, "eval_PERSON_recall": 0.006535947712418301, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0, "eval_TIME_number": 31, "eval_TIME_precision": 0.0, "eval_TIME_recall": 0.0, "eval_loss": 0.6359996199607849, "eval_overall_accuracy": 0.8357691354966559, "eval_overall_f1": 0.005698005698005698, "eval_overall_precision": 0.2, "eval_overall_recall": 0.002890173410404624, "eval_runtime": 0.3296, "eval_samples_per_second": 567.378, "eval_steps_per_second": 9.102, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.5572154521942139, "learning_rate": 4.9e-05, "loss": 0.5712, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.22471910112359553, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5, "eval_LOCATION_recall": 0.14492753623188406, "eval_ORGANIZATION_f1": 0.046511627906976744, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.08, "eval_ORGANIZATION_recall": 0.03278688524590164, "eval_PERSON_f1": 0.45, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.4311377245508982, "eval_PERSON_recall": 0.47058823529411764, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.5384615384615384, "eval_TIME_number": 31, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.45161290322580644, "eval_loss": 0.43386390805244446, "eval_overall_accuracy": 0.8806044092147635, "eval_overall_f1": 0.33851468048359246, "eval_overall_precision": 0.4206008583690987, "eval_overall_recall": 0.2832369942196532, "eval_runtime": 0.3244, "eval_samples_per_second": 576.457, "eval_steps_per_second": 9.248, "step": 212 }, { "epoch": 3.0, "grad_norm": 1.6938573122024536, "learning_rate": 4.85e-05, "loss": 0.4084, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5405405405405406, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5063291139240507, "eval_LOCATION_recall": 0.5797101449275363, "eval_ORGANIZATION_f1": 0.29059829059829057, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.30357142857142855, "eval_ORGANIZATION_recall": 0.2786885245901639, "eval_PERSON_f1": 0.6467391304347827, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.5534883720930233, "eval_PERSON_recall": 0.7777777777777778, "eval_QUANTITY_f1": 0.22580645161290322, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.23333333333333334, "eval_QUANTITY_recall": 0.21875, "eval_TIME_f1": 0.6875, "eval_TIME_number": 31, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.7096774193548387, "eval_loss": 0.3173196017742157, "eval_overall_accuracy": 0.9165221699281645, "eval_overall_f1": 0.5401844532279314, "eval_overall_precision": 0.4963680387409201, "eval_overall_recall": 0.5924855491329479, "eval_runtime": 0.3294, "eval_samples_per_second": 567.711, "eval_steps_per_second": 9.108, "step": 318 }, { "epoch": 4.0, "grad_norm": 3.1388819217681885, "learning_rate": 4.8e-05, "loss": 0.306, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6143790849673202, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5595238095238095, "eval_LOCATION_recall": 0.6811594202898551, "eval_ORGANIZATION_f1": 0.4444444444444445, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.4642857142857143, "eval_ORGANIZATION_recall": 0.4262295081967213, "eval_PERSON_f1": 0.7669616519174042, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.6989247311827957, "eval_PERSON_recall": 0.8496732026143791, "eval_QUANTITY_f1": 0.6086956521739131, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5675675675675675, "eval_QUANTITY_recall": 0.65625, "eval_TIME_f1": 0.8064516129032258, "eval_TIME_number": 31, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8064516129032258, "eval_loss": 0.22655707597732544, "eval_overall_accuracy": 0.9370819915779044, "eval_overall_f1": 0.672972972972973, "eval_overall_precision": 0.631979695431472, "eval_overall_recall": 0.7196531791907514, "eval_runtime": 0.3329, "eval_samples_per_second": 561.669, "eval_steps_per_second": 9.011, "step": 424 }, { "epoch": 5.0, "grad_norm": 2.1097211837768555, "learning_rate": 4.75e-05, "loss": 0.2369, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.6285714285714286, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.5188679245283019, "eval_LOCATION_recall": 0.7971014492753623, "eval_ORGANIZATION_f1": 0.5442176870748299, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.46511627906976744, "eval_ORGANIZATION_recall": 0.6557377049180327, "eval_PERSON_f1": 0.7930029154518949, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.7157894736842105, "eval_PERSON_recall": 0.8888888888888888, "eval_QUANTITY_f1": 0.5499999999999999, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.4583333333333333, "eval_QUANTITY_recall": 0.6875, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.21178996562957764, "eval_overall_accuracy": 0.9380728263562051, "eval_overall_f1": 0.6897404202719406, "eval_overall_precision": 0.6025917926565875, "eval_overall_recall": 0.8063583815028902, "eval_runtime": 0.3324, "eval_samples_per_second": 562.65, "eval_steps_per_second": 9.026, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.1763736009597778, "learning_rate": 4.7e-05, "loss": 0.1993, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7037037037037037, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6129032258064516, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.6153846153846154, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5365853658536586, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.8195718654434252, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.7701149425287356, "eval_PERSON_recall": 0.8758169934640523, "eval_QUANTITY_f1": 0.5753424657534246, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5121951219512195, "eval_QUANTITY_recall": 0.65625, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17126347124576569, "eval_overall_accuracy": 0.9482288828337875, "eval_overall_f1": 0.7369791666666667, "eval_overall_precision": 0.6706161137440758, "eval_overall_recall": 0.8179190751445087, "eval_runtime": 0.3356, "eval_samples_per_second": 557.292, "eval_steps_per_second": 8.941, "step": 636 }, { "epoch": 7.0, "grad_norm": 1.0250859260559082, "learning_rate": 4.6500000000000005e-05, "loss": 0.1745, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7466666666666666, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.691358024691358, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.6122448979591837, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5232558139534884, "eval_ORGANIZATION_recall": 0.7377049180327869, "eval_PERSON_f1": 0.8385093167701864, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.7988165680473372, "eval_PERSON_recall": 0.8823529411764706, "eval_QUANTITY_f1": 0.6216216216216217, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5476190476190477, "eval_QUANTITY_recall": 0.71875, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15598997473716736, "eval_overall_accuracy": 0.9512013871686896, "eval_overall_f1": 0.7566137566137565, "eval_overall_precision": 0.697560975609756, "eval_overall_recall": 0.8265895953757225, "eval_runtime": 0.3325, "eval_samples_per_second": 562.394, "eval_steps_per_second": 9.022, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.9757563471794128, "learning_rate": 4.600000000000001e-05, "loss": 0.158, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6344827586206897, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5476190476190477, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.8411214953271029, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8035714285714286, "eval_PERSON_recall": 0.8823529411764706, "eval_QUANTITY_f1": 0.6301369863013699, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5609756097560976, "eval_QUANTITY_recall": 0.71875, "eval_TIME_f1": 0.7536231884057972, "eval_TIME_number": 31, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.15038101375102997, "eval_overall_accuracy": 0.9521922219469904, "eval_overall_f1": 0.7595269382391591, "eval_overall_precision": 0.6963855421686747, "eval_overall_recall": 0.8352601156069365, "eval_runtime": 0.3277, "eval_samples_per_second": 570.677, "eval_steps_per_second": 9.155, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.060363531112671, "learning_rate": 4.55e-05, "loss": 0.1464, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7692307692307693, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6153846153846154, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5365853658536586, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.8490566037735848, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8181818181818182, "eval_PERSON_recall": 0.8823529411764706, "eval_QUANTITY_f1": 0.6666666666666665, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14481940865516663, "eval_overall_accuracy": 0.9529353480307159, "eval_overall_f1": 0.7655629139072848, "eval_overall_precision": 0.706601466992665, "eval_overall_recall": 0.8352601156069365, "eval_runtime": 0.3329, "eval_samples_per_second": 561.801, "eval_steps_per_second": 9.013, "step": 954 }, { "epoch": 10.0, "grad_norm": 0.9707283973693848, "learning_rate": 4.5e-05, "loss": 0.14, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.786206896551724, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.6222222222222222, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5675675675675675, "eval_ORGANIZATION_recall": 0.6885245901639344, "eval_PERSON_f1": 0.8444444444444443, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8209876543209876, "eval_PERSON_recall": 0.869281045751634, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13176114857196808, "eval_overall_accuracy": 0.9583849393113698, "eval_overall_f1": 0.7770177838577291, "eval_overall_precision": 0.7376623376623377, "eval_overall_recall": 0.8208092485549133, "eval_runtime": 0.3277, "eval_samples_per_second": 570.689, "eval_steps_per_second": 9.155, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.8272536396980286, "learning_rate": 4.4500000000000004e-05, "loss": 0.1336, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6941176470588235, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6259541984732824, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5857142857142857, "eval_ORGANIZATION_recall": 0.6721311475409836, "eval_PERSON_f1": 0.860759493670886, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.8888888888888888, "eval_QUANTITY_f1": 0.6575342465753423, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5853658536585366, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13256430625915527, "eval_overall_accuracy": 0.955907852365618, "eval_overall_f1": 0.7735849056603774, "eval_overall_precision": 0.7247474747474747, "eval_overall_recall": 0.8294797687861272, "eval_runtime": 0.3322, "eval_samples_per_second": 562.93, "eval_steps_per_second": 9.031, "step": 1166 }, { "epoch": 12.0, "grad_norm": 2.3991382122039795, "learning_rate": 4.4000000000000006e-05, "loss": 0.126, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7894736842105263, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6616541353383459, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.8695652173913043, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8284023668639053, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.6486486486486486, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13229668140411377, "eval_overall_accuracy": 0.9568986871439188, "eval_overall_f1": 0.7887700534759359, "eval_overall_precision": 0.7338308457711443, "eval_overall_recall": 0.8526011560693642, "eval_runtime": 0.3344, "eval_samples_per_second": 559.23, "eval_steps_per_second": 8.972, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.8172109723091125, "learning_rate": 4.35e-05, "loss": 0.1209, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6808510638297871, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.8687500000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8323353293413174, "eval_PERSON_recall": 0.9084967320261438, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12979264557361603, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8026845637583893, "eval_overall_precision": 0.7493734335839599, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.3357, "eval_samples_per_second": 557.123, "eval_steps_per_second": 8.938, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.386945366859436, "learning_rate": 4.3e-05, "loss": 0.1172, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6883116883116883, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5698924731182796, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8650306748466258, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.815028901734104, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.6486486486486486, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.7536231884057972, "eval_TIME_number": 31, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14491254091262817, "eval_overall_accuracy": 0.9529353480307159, "eval_overall_f1": 0.7839586028460543, "eval_overall_precision": 0.7096018735362998, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3283, "eval_samples_per_second": 569.521, "eval_steps_per_second": 9.137, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.46282199025154114, "learning_rate": 4.25e-05, "loss": 0.1135, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6969696969696969, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.647887323943662, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.8580441640378549, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8292682926829268, "eval_PERSON_recall": 0.8888888888888888, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12623363733291626, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8032786885245903, "eval_overall_precision": 0.7616580310880829, "eval_overall_recall": 0.8497109826589595, "eval_runtime": 0.3327, "eval_samples_per_second": 562.012, "eval_steps_per_second": 9.016, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.5779574513435364, "learning_rate": 4.2e-05, "loss": 0.1087, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.620253164556962, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8624999999999999, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8263473053892215, "eval_PERSON_recall": 0.9019607843137255, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1268586367368698, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8070175438596492, "eval_overall_precision": 0.7569620253164557, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.326, "eval_samples_per_second": 573.612, "eval_steps_per_second": 9.202, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.2563510537147522, "learning_rate": 4.15e-05, "loss": 0.1041, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8652037617554859, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8313253012048193, "eval_PERSON_recall": 0.9019607843137255, "eval_QUANTITY_f1": 0.7027027027027026, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6190476190476191, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13557660579681396, "eval_overall_accuracy": 0.9583849393113698, "eval_overall_f1": 0.8079999999999999, "eval_overall_precision": 0.75, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3329, "eval_samples_per_second": 561.696, "eval_steps_per_second": 9.011, "step": 1802 }, { "epoch": 18.0, "grad_norm": 2.330004930496216, "learning_rate": 4.1e-05, "loss": 0.102, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6818181818181818, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6338028169014085, "eval_ORGANIZATION_recall": 0.7377049180327869, "eval_PERSON_f1": 0.8643533123028391, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.8954248366013072, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.128007709980011, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.7994542974079127, "eval_overall_precision": 0.7571059431524548, "eval_overall_recall": 0.846820809248555, "eval_runtime": 0.3322, "eval_samples_per_second": 562.934, "eval_steps_per_second": 9.031, "step": 1908 }, { "epoch": 19.0, "grad_norm": 1.4404404163360596, "learning_rate": 4.05e-05, "loss": 0.0999, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6715328467153285, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6052631578947368, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.8706624605678233, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.9019607843137255, "eval_QUANTITY_f1": 0.6857142857142857, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.631578947368421, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12171030044555664, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.8043478260869564, "eval_overall_precision": 0.7589743589743589, "eval_overall_recall": 0.8554913294797688, "eval_runtime": 0.3267, "eval_samples_per_second": 572.375, "eval_steps_per_second": 9.182, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.6656851768493652, "learning_rate": 4e-05, "loss": 0.0942, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7894736842105263, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7391304347826089, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6623376623376623, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8757763975155279, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.834319526627219, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13243292272090912, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8100929614873839, "eval_overall_precision": 0.7493857493857494, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3326, "eval_samples_per_second": 562.253, "eval_steps_per_second": 9.02, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.6464937329292297, "learning_rate": 3.9500000000000005e-05, "loss": 0.0932, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7770700636942676, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6931818181818182, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8730650154798762, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8294117647058824, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.6944444444444444, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.625, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.7647058823529411, "eval_TIME_number": 31, "eval_TIME_precision": 0.7027027027027027, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14281630516052246, "eval_overall_accuracy": 0.9564032697547684, "eval_overall_f1": 0.8010471204188482, "eval_overall_precision": 0.7320574162679426, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3327, "eval_samples_per_second": 561.987, "eval_steps_per_second": 9.016, "step": 2226 }, { "epoch": 22.0, "grad_norm": 1.1358213424682617, "learning_rate": 3.9000000000000006e-05, "loss": 0.0916, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8785046728971961, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8392857142857143, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.12807393074035645, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8200270635994588, "eval_overall_precision": 0.7709923664122137, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3327, "eval_samples_per_second": 562.083, "eval_steps_per_second": 9.017, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.7238495945930481, "learning_rate": 3.85e-05, "loss": 0.0892, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1260461062192917, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8216216216216216, "eval_overall_precision": 0.7715736040609137, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3325, "eval_samples_per_second": 562.346, "eval_steps_per_second": 9.022, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.773553490638733, "learning_rate": 3.8e-05, "loss": 0.0865, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7692307692307693, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6896551724137931, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7647058823529411, "eval_TIME_number": 31, "eval_TIME_precision": 0.7027027027027027, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14333529770374298, "eval_overall_accuracy": 0.9578895219222194, "eval_overall_f1": 0.8073878627968338, "eval_overall_precision": 0.7427184466019418, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.333, "eval_samples_per_second": 561.546, "eval_steps_per_second": 9.009, "step": 2544 }, { "epoch": 25.0, "grad_norm": 1.2657068967819214, "learning_rate": 3.7500000000000003e-05, "loss": 0.0834, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7746478873239437, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13225042819976807, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8246318607764391, "eval_overall_precision": 0.7680798004987531, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3265, "eval_samples_per_second": 572.661, "eval_steps_per_second": 9.187, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.338986873626709, "learning_rate": 3.7e-05, "loss": 0.0823, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7638888888888888, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6626506024096386, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13243231177330017, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8273092369477911, "eval_overall_precision": 0.770573566084788, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.332, "eval_samples_per_second": 563.211, "eval_steps_per_second": 9.035, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.9946244955062866, "learning_rate": 3.65e-05, "loss": 0.0809, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7391304347826089, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6623376623376623, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13205386698246002, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8216216216216216, "eval_overall_precision": 0.7715736040609137, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3268, "eval_samples_per_second": 572.171, "eval_steps_per_second": 9.179, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.337754487991333, "learning_rate": 3.6e-05, "loss": 0.0793, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6766917293233082, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.7377049180327869, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1275886595249176, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.809782608695652, "eval_overall_precision": 0.764102564102564, "eval_overall_recall": 0.861271676300578, "eval_runtime": 0.3333, "eval_samples_per_second": 561.108, "eval_steps_per_second": 9.002, "step": 2968 }, { "epoch": 29.0, "grad_norm": 1.4286695718765259, "learning_rate": 3.55e-05, "loss": 0.0759, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7428571428571428, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6582278481012658, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.880503144654088, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13053637742996216, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8205128205128205, "eval_overall_precision": 0.769620253164557, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3332, "eval_samples_per_second": 561.235, "eval_steps_per_second": 9.004, "step": 3074 }, { "epoch": 30.0, "grad_norm": 1.020611047744751, "learning_rate": 3.5e-05, "loss": 0.0742, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7164179104477612, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6857142857142857, "eval_QUANTITY_recall": 0.75, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13522376120090485, "eval_overall_accuracy": 0.9596234827842457, "eval_overall_f1": 0.8139223560910309, "eval_overall_precision": 0.7581047381546134, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.334, "eval_samples_per_second": 559.963, "eval_steps_per_second": 8.983, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.5647078156471252, "learning_rate": 3.45e-05, "loss": 0.0755, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7014925373134328, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6438356164383562, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.8777429467084639, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8433734939759037, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12345639616250992, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8125000000000001, "eval_overall_precision": 0.7666666666666667, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.326, "eval_samples_per_second": 573.599, "eval_steps_per_second": 9.202, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.8619909286499023, "learning_rate": 3.4000000000000007e-05, "loss": 0.0709, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.126638263463974, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8209959623149394, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3268, "eval_samples_per_second": 572.145, "eval_steps_per_second": 9.179, "step": 3392 }, { "epoch": 33.0, "grad_norm": 3.400688886642456, "learning_rate": 3.35e-05, "loss": 0.0711, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.762589928057554, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7352941176470588, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6944444444444444, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.12633301317691803, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8272108843537415, "eval_overall_precision": 0.781491002570694, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3276, "eval_samples_per_second": 570.79, "eval_steps_per_second": 9.157, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.6063269376754761, "learning_rate": 3.3e-05, "loss": 0.0698, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.7947019867549668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8875000000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13981756567955017, "eval_overall_accuracy": 0.9591280653950953, "eval_overall_f1": 0.8132450331125827, "eval_overall_precision": 0.7506112469437652, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3327, "eval_samples_per_second": 562.139, "eval_steps_per_second": 9.018, "step": 3604 }, { "epoch": 35.0, "grad_norm": 2.01218843460083, "learning_rate": 3.2500000000000004e-05, "loss": 0.0669, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7248322147651006, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6136363636363636, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.8895899053627759, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1391025334596634, "eval_overall_accuracy": 0.958632648005945, "eval_overall_f1": 0.8100929614873839, "eval_overall_precision": 0.7493857493857494, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3328, "eval_samples_per_second": 561.911, "eval_steps_per_second": 9.015, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.48844727873802185, "learning_rate": 3.2000000000000005e-05, "loss": 0.0659, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7310344827586208, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8606060606060606, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13162988424301147, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.8192771084337348, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3328, "eval_samples_per_second": 561.896, "eval_steps_per_second": 9.014, "step": 3816 }, { "epoch": 37.0, "grad_norm": 1.3096176385879517, "learning_rate": 3.15e-05, "loss": 0.0627, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7297297297297297, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.8895899053627759, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13473619520664215, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8186666666666668, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3342, "eval_samples_per_second": 559.531, "eval_steps_per_second": 8.976, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.9041996598243713, "learning_rate": 3.1e-05, "loss": 0.0627, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7412587412587412, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6463414634146342, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 31, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13561618328094482, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3327, "eval_samples_per_second": 562.038, "eval_steps_per_second": 9.017, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.9759089350700378, "learning_rate": 3.05e-05, "loss": 0.0592, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7246376811594203, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6493506493506493, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.880503144654088, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1278260350227356, "eval_overall_accuracy": 0.964082239286599, "eval_overall_f1": 0.8283378746594006, "eval_overall_precision": 0.7835051546391752, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3329, "eval_samples_per_second": 561.813, "eval_steps_per_second": 9.013, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.8231136798858643, "learning_rate": 3e-05, "loss": 0.06, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7581699346405228, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.880503144654088, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.13648688793182373, "eval_overall_accuracy": 0.9598711914788209, "eval_overall_f1": 0.8085676037483266, "eval_overall_precision": 0.7531172069825436, "eval_overall_recall": 0.8728323699421965, "eval_runtime": 0.3327, "eval_samples_per_second": 562.148, "eval_steps_per_second": 9.018, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.8856554627418518, "learning_rate": 2.95e-05, "loss": 0.0583, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7586206896551725, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6547619047619048, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.8819875776397514, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8402366863905325, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8125, "eval_TIME_number": 31, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.1364709734916687, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.822429906542056, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3319, "eval_samples_per_second": 563.438, "eval_steps_per_second": 9.039, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.7966371178627014, "learning_rate": 2.9e-05, "loss": 0.0592, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7482993197278911, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.896551724137931, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8614457831325302, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14667053520679474, "eval_overall_accuracy": 0.9593757740896706, "eval_overall_f1": 0.824468085106383, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3276, "eval_samples_per_second": 570.779, "eval_steps_per_second": 9.157, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.6787899732589722, "learning_rate": 2.8499999999999998e-05, "loss": 0.0584, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7092198581560285, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8875000000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7123287671232876, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6341463414634146, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.787878787878788, "eval_TIME_number": 31, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14089816808700562, "eval_overall_accuracy": 0.9591280653950953, "eval_overall_f1": 0.8133333333333334, "eval_overall_precision": 0.754950495049505, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3317, "eval_samples_per_second": 563.793, "eval_steps_per_second": 9.045, "step": 4558 }, { "epoch": 44.0, "grad_norm": 1.8825234174728394, "learning_rate": 2.8000000000000003e-05, "loss": 0.0571, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1371491551399231, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8209959623149394, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3331, "eval_samples_per_second": 561.467, "eval_steps_per_second": 9.007, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.0761770009994507, "learning_rate": 2.7500000000000004e-05, "loss": 0.0568, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8163265306122449, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7692307692307693, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.75177304964539, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6625, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9084967320261438, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8709677419354839, "eval_TIME_number": 31, "eval_TIME_precision": 0.8709677419354839, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1322641521692276, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8310626702997275, "eval_overall_precision": 0.7860824742268041, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3327, "eval_samples_per_second": 562.056, "eval_steps_per_second": 9.017, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.5931002497673035, "learning_rate": 2.7000000000000002e-05, "loss": 0.0518, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7142857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6578947368421053, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14024412631988525, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8165997322623829, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3334, "eval_samples_per_second": 560.842, "eval_steps_per_second": 8.997, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.7838124632835388, "learning_rate": 2.6500000000000004e-05, "loss": 0.0529, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7310344827586208, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7246376811594203, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6756756756756757, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1365956962108612, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8172043010752688, "eval_overall_precision": 0.7638190954773869, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3326, "eval_samples_per_second": 562.284, "eval_steps_per_second": 9.021, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.4798297882080078, "learning_rate": 2.6000000000000002e-05, "loss": 0.0516, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7153284671532848, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.880503144654088, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14157778024673462, "eval_overall_accuracy": 0.9598711914788209, "eval_overall_f1": 0.8167115902964959, "eval_overall_precision": 0.7651515151515151, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3333, "eval_samples_per_second": 561.042, "eval_steps_per_second": 9.001, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.9078386425971985, "learning_rate": 2.5500000000000003e-05, "loss": 0.0524, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7285714285714285, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6455696202531646, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8606060606060606, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14155249297618866, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8286099865047234, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3319, "eval_samples_per_second": 563.426, "eval_steps_per_second": 9.039, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.6509796380996704, "learning_rate": 2.5e-05, "loss": 0.0494, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1381203830242157, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8254397834912043, "eval_overall_precision": 0.7760814249363868, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3345, "eval_samples_per_second": 559.02, "eval_steps_per_second": 8.968, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.7626707553863525, "learning_rate": 2.45e-05, "loss": 0.0478, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7297297297297297, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6206896551724138, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14348609745502472, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.8310991957104559, "eval_overall_precision": 0.775, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3315, "eval_samples_per_second": 564.037, "eval_steps_per_second": 9.049, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.5748308300971985, "learning_rate": 2.4e-05, "loss": 0.0485, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14024515450000763, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.836021505376344, "eval_overall_precision": 0.7814070351758794, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3324, "eval_samples_per_second": 562.57, "eval_steps_per_second": 9.025, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.001908779144287, "learning_rate": 2.35e-05, "loss": 0.0475, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.13823822140693665, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.8313090418353577, "eval_overall_precision": 0.779746835443038, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3335, "eval_samples_per_second": 560.779, "eval_steps_per_second": 8.996, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.5605162382125854, "learning_rate": 2.3000000000000003e-05, "loss": 0.0481, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.7919463087248322, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7285714285714285, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6455696202531646, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8867924528301887, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8545454545454545, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14209988713264465, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8209959623149394, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3329, "eval_samples_per_second": 561.696, "eval_steps_per_second": 9.011, "step": 5724 }, { "epoch": 55.0, "grad_norm": 1.0782426595687866, "learning_rate": 2.25e-05, "loss": 0.0474, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7432432432432433, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.8909657320872275, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8511904761904762, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14407247304916382, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8346666666666667, "eval_overall_precision": 0.7747524752475248, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3328, "eval_samples_per_second": 561.974, "eval_steps_per_second": 9.016, "step": 5830 }, { "epoch": 56.0, "grad_norm": 2.055668592453003, "learning_rate": 2.2000000000000003e-05, "loss": 0.0456, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7153284671532848, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6447368421052632, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8606060606060606, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14129342138767242, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3322, "eval_samples_per_second": 562.981, "eval_steps_per_second": 9.032, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.7829787135124207, "learning_rate": 2.15e-05, "loss": 0.0451, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7428571428571428, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6582278481012658, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.89375, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8562874251497006, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14520226418972015, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7719298245614035, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3271, "eval_samples_per_second": 571.771, "eval_steps_per_second": 9.173, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.2567724287509918, "learning_rate": 2.1e-05, "loss": 0.0437, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7222222222222222, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6265060240963856, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8958990536277602, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8658536585365854, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14597974717617035, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3323, "eval_samples_per_second": 562.69, "eval_steps_per_second": 9.027, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.4437527656555176, "learning_rate": 2.05e-05, "loss": 0.0424, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6341463414634146, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8875000000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1500689834356308, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8186666666666668, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3324, "eval_samples_per_second": 562.659, "eval_steps_per_second": 9.027, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.7316974997520447, "learning_rate": 2e-05, "loss": 0.0423, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7210884353741497, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8847352024922119, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8452380952380952, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7323943661971831, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15397267043590546, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8169761273209548, "eval_overall_precision": 0.7549019607843137, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3265, "eval_samples_per_second": 572.825, "eval_steps_per_second": 9.19, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.7264176607131958, "learning_rate": 1.9500000000000003e-05, "loss": 0.041, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.147948756814003, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8208556149732621, "eval_overall_precision": 0.763681592039801, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3335, "eval_samples_per_second": 560.648, "eval_steps_per_second": 8.994, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.7140088677406311, "learning_rate": 1.9e-05, "loss": 0.0405, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8847352024922119, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8452380952380952, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.148734450340271, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8150134048257373, "eval_overall_precision": 0.76, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.333, "eval_samples_per_second": 561.598, "eval_steps_per_second": 9.01, "step": 6572 }, { "epoch": 63.0, "grad_norm": 1.8145302534103394, "learning_rate": 1.85e-05, "loss": 0.0394, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.8902821316614421, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8554216867469879, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14801925420761108, "eval_overall_accuracy": 0.9625959871191478, "eval_overall_f1": 0.8241610738255033, "eval_overall_precision": 0.7694235588972431, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3325, "eval_samples_per_second": 562.37, "eval_steps_per_second": 9.022, "step": 6678 }, { "epoch": 64.0, "grad_norm": 1.2566087245941162, "learning_rate": 1.8e-05, "loss": 0.0384, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7346938775510204, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.627906976744186, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.89375, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8562874251497006, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15676021575927734, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.824468085106383, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.333, "eval_samples_per_second": 561.621, "eval_steps_per_second": 9.01, "step": 6784 }, { "epoch": 65.0, "grad_norm": 1.431575894355774, "learning_rate": 1.75e-05, "loss": 0.0397, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8785046728971961, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8392857142857143, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7605633802816902, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6923076923076923, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14874185621738434, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7593052109181141, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3264, "eval_samples_per_second": 572.977, "eval_steps_per_second": 9.192, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.1114250421524048, "learning_rate": 1.7000000000000003e-05, "loss": 0.0388, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7074829931972788, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6046511627906976, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8916408668730651, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8470588235294118, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1624731570482254, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8153034300791557, "eval_overall_precision": 0.75, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3323, "eval_samples_per_second": 562.754, "eval_steps_per_second": 9.028, "step": 6996 }, { "epoch": 67.0, "grad_norm": 2.434706926345825, "learning_rate": 1.65e-05, "loss": 0.0402, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7123287671232876, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.611764705882353, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8909657320872275, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8511904761904762, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1620258390903473, "eval_overall_accuracy": 0.9596234827842457, "eval_overall_f1": 0.8201058201058201, "eval_overall_precision": 0.7560975609756098, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3325, "eval_samples_per_second": 562.349, "eval_steps_per_second": 9.022, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.43614867329597473, "learning_rate": 1.6000000000000003e-05, "loss": 0.0397, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7183098591549297, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6296296296296297, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1530744731426239, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8155080213903744, "eval_overall_precision": 0.7587064676616916, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.328, "eval_samples_per_second": 570.186, "eval_steps_per_second": 9.147, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.2761048078536987, "learning_rate": 1.55e-05, "loss": 0.0383, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7034482758620689, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6071428571428571, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8847352024922119, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8452380952380952, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15172313153743744, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8219544846050869, "eval_overall_precision": 0.7655860349127181, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3319, "eval_samples_per_second": 563.458, "eval_steps_per_second": 9.039, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.8664883375167847, "learning_rate": 1.5e-05, "loss": 0.0375, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7172413793103448, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6190476190476191, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8875000000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1547580361366272, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8208556149732621, "eval_overall_precision": 0.763681592039801, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3256, "eval_samples_per_second": 574.274, "eval_steps_per_second": 9.213, "step": 7420 }, { "epoch": 71.0, "grad_norm": 2.3128960132598877, "learning_rate": 1.45e-05, "loss": 0.0368, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.689655172413793, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5952380952380952, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15528355538845062, "eval_overall_accuracy": 0.9598711914788209, "eval_overall_f1": 0.8117489986648866, "eval_overall_precision": 0.7543424317617866, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3322, "eval_samples_per_second": 562.889, "eval_steps_per_second": 9.03, "step": 7526 }, { "epoch": 72.0, "grad_norm": 2.342613458633423, "learning_rate": 1.4000000000000001e-05, "loss": 0.0375, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15482325851917267, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8150134048257373, "eval_overall_precision": 0.76, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3322, "eval_samples_per_second": 562.879, "eval_steps_per_second": 9.03, "step": 7632 }, { "epoch": 73.0, "grad_norm": 2.5355284214019775, "learning_rate": 1.3500000000000001e-05, "loss": 0.0364, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.6950354609929078, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6125, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15112702548503876, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.811320754716981, "eval_overall_precision": 0.76010101010101, "eval_overall_recall": 0.869942196531792, "eval_runtime": 0.3265, "eval_samples_per_second": 572.81, "eval_steps_per_second": 9.189, "step": 7738 }, { "epoch": 74.0, "grad_norm": 2.763317108154297, "learning_rate": 1.3000000000000001e-05, "loss": 0.0356, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6944444444444445, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6024096385542169, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15702202916145325, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8128342245989304, "eval_overall_precision": 0.7562189054726368, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3325, "eval_samples_per_second": 562.361, "eval_steps_per_second": 9.022, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.9147346615791321, "learning_rate": 1.25e-05, "loss": 0.0345, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8053691275167786, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7132867132867133, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6219512195121951, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8875000000000001, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8502994011976048, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.160079225897789, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8192771084337348, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3259, "eval_samples_per_second": 573.758, "eval_steps_per_second": 9.205, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.9755911827087402, "learning_rate": 1.2e-05, "loss": 0.0358, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7172413793103448, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6190476190476191, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15988942980766296, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.816, "eval_overall_precision": 0.7574257425742574, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3322, "eval_samples_per_second": 562.905, "eval_steps_per_second": 9.031, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.6485092639923096, "learning_rate": 1.1500000000000002e-05, "loss": 0.0359, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7092198581560285, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15627126395702362, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8236877523553163, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.333, "eval_samples_per_second": 561.64, "eval_steps_per_second": 9.01, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.8235780596733093, "learning_rate": 1.1000000000000001e-05, "loss": 0.0328, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7050359712230215, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6282051282051282, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15545301139354706, "eval_overall_accuracy": 0.9616051523408472, "eval_overall_f1": 0.8216216216216216, "eval_overall_precision": 0.7715736040609137, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3276, "eval_samples_per_second": 570.819, "eval_steps_per_second": 9.158, "step": 8268 }, { "epoch": 79.0, "grad_norm": 1.297727108001709, "learning_rate": 1.05e-05, "loss": 0.034, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7183098591549297, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6296296296296297, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1584213823080063, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3318, "eval_samples_per_second": 563.58, "eval_steps_per_second": 9.041, "step": 8374 }, { "epoch": 80.0, "grad_norm": 1.0464829206466675, "learning_rate": 1e-05, "loss": 0.0344, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15635241568088531, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8216216216216216, "eval_overall_precision": 0.7715736040609137, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3334, "eval_samples_per_second": 560.931, "eval_steps_per_second": 8.999, "step": 8480 }, { "epoch": 81.0, "grad_norm": 1.1984474658966064, "learning_rate": 9.5e-06, "loss": 0.0337, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6950354609929078, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6125, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16573630273342133, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8150134048257373, "eval_overall_precision": 0.76, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3335, "eval_samples_per_second": 560.721, "eval_steps_per_second": 8.996, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.3891063928604126, "learning_rate": 9e-06, "loss": 0.0331, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6986301369863014, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.88125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.844311377245509, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16680771112442017, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8186666666666668, "eval_overall_precision": 0.7599009900990099, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.326, "eval_samples_per_second": 573.602, "eval_steps_per_second": 9.202, "step": 8692 }, { "epoch": 83.0, "grad_norm": 1.0325218439102173, "learning_rate": 8.500000000000002e-06, "loss": 0.0328, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.880503144654088, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15955756604671478, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8167115902964959, "eval_overall_precision": 0.7651515151515151, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3325, "eval_samples_per_second": 562.469, "eval_steps_per_second": 9.024, "step": 8798 }, { "epoch": 84.0, "grad_norm": 1.833433747291565, "learning_rate": 8.000000000000001e-06, "loss": 0.0339, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.723404255319149, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6375, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15904375910758972, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3326, "eval_samples_per_second": 562.206, "eval_steps_per_second": 9.019, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.8579007983207703, "learning_rate": 7.5e-06, "loss": 0.0324, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6906474820143885, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.8742138364779874, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9084967320261438, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.15392935276031494, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8092016238159675, "eval_overall_precision": 0.7608142493638677, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.3321, "eval_samples_per_second": 563.068, "eval_steps_per_second": 9.033, "step": 9010 }, { "epoch": 86.0, "grad_norm": 2.3941845893859863, "learning_rate": 7.000000000000001e-06, "loss": 0.0327, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6762589928057554, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6025641025641025, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.875, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8383233532934131, "eval_PERSON_recall": 0.9150326797385621, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1588955819606781, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8053691275167784, "eval_overall_precision": 0.7518796992481203, "eval_overall_recall": 0.8670520231213873, "eval_runtime": 0.3263, "eval_samples_per_second": 573.03, "eval_steps_per_second": 9.193, "step": 9116 }, { "epoch": 87.0, "grad_norm": 1.8358588218688965, "learning_rate": 6.5000000000000004e-06, "loss": 0.0318, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.723404255319149, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6375, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16152726113796234, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8198924731182795, "eval_overall_precision": 0.7663316582914573, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3317, "eval_samples_per_second": 563.682, "eval_steps_per_second": 9.043, "step": 9222 }, { "epoch": 88.0, "grad_norm": 2.0525128841400146, "learning_rate": 6e-06, "loss": 0.0311, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6906474820143885, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6153846153846154, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16066040098667145, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8129205921938087, "eval_overall_precision": 0.760705289672544, "eval_overall_recall": 0.8728323699421965, "eval_runtime": 0.3324, "eval_samples_per_second": 562.545, "eval_steps_per_second": 9.025, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.892722487449646, "learning_rate": 5.500000000000001e-06, "loss": 0.033, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6956521739130435, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6233766233766234, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16328519582748413, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8118279569892471, "eval_overall_precision": 0.7587939698492462, "eval_overall_recall": 0.8728323699421965, "eval_runtime": 0.3318, "eval_samples_per_second": 563.6, "eval_steps_per_second": 9.042, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.3466918468475342, "learning_rate": 5e-06, "loss": 0.0314, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.7999999999999999, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.620253164556962, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1654297560453415, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3339, "eval_samples_per_second": 560.083, "eval_steps_per_second": 8.985, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.5831097960472107, "learning_rate": 4.5e-06, "loss": 0.0317, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.620253164556962, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16038751602172852, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8145161290322581, "eval_overall_precision": 0.7613065326633166, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3258, "eval_samples_per_second": 573.92, "eval_steps_per_second": 9.207, "step": 9646 }, { "epoch": 92.0, "grad_norm": 2.8795530796051025, "learning_rate": 4.000000000000001e-06, "loss": 0.0313, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16018863022327423, "eval_overall_accuracy": 0.961357443646272, "eval_overall_f1": 0.8156123822341858, "eval_overall_precision": 0.7632241813602015, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3325, "eval_samples_per_second": 562.323, "eval_steps_per_second": 9.021, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.9272975325584412, "learning_rate": 3.5000000000000004e-06, "loss": 0.0317, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16194607317447662, "eval_overall_accuracy": 0.9611097349516968, "eval_overall_f1": 0.8183041722745625, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3339, "eval_samples_per_second": 560.094, "eval_steps_per_second": 8.985, "step": 9858 }, { "epoch": 94.0, "grad_norm": 1.6155447959899902, "learning_rate": 3e-06, "loss": 0.0322, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7272727272727272, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6341463414634146, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16590212285518646, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8203753351206433, "eval_overall_precision": 0.765, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.332, "eval_samples_per_second": 563.263, "eval_steps_per_second": 9.036, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.8714067339897156, "learning_rate": 2.5e-06, "loss": 0.0305, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16414810717105865, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8128342245989304, "eval_overall_precision": 0.7562189054726368, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3262, "eval_samples_per_second": 573.227, "eval_steps_per_second": 9.196, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.7234588265419006, "learning_rate": 2.0000000000000003e-06, "loss": 0.0302, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7050359712230215, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6282051282051282, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1619059145450592, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8167115902964959, "eval_overall_precision": 0.7651515151515151, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3323, "eval_samples_per_second": 562.669, "eval_steps_per_second": 9.027, "step": 10176 }, { "epoch": 97.0, "grad_norm": 1.2419594526290894, "learning_rate": 1.5e-06, "loss": 0.0309, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7866666666666667, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7183098591549297, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6296296296296297, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1639154851436615, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3326, "eval_samples_per_second": 562.252, "eval_steps_per_second": 9.02, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.3145425021648407, "learning_rate": 1.0000000000000002e-06, "loss": 0.0288, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.16421489417552948, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8139223560910309, "eval_overall_precision": 0.7581047381546134, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3325, "eval_samples_per_second": 562.38, "eval_steps_per_second": 9.022, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.6178627610206604, "learning_rate": 5.000000000000001e-07, "loss": 0.0307, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6901408450704226, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6049382716049383, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1645815670490265, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8112449799196787, "eval_overall_precision": 0.7556109725685786, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.332, "eval_samples_per_second": 563.213, "eval_steps_per_second": 9.036, "step": 10494 }, { "epoch": 100.0, "grad_norm": 1.0940686464309692, "learning_rate": 0.0, "loss": 0.032, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.8840125391849529, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1641756296157837, "eval_overall_accuracy": 0.9603666088679713, "eval_overall_f1": 0.8128342245989304, "eval_overall_precision": 0.7562189054726368, "eval_overall_recall": 0.8786127167630058, "eval_runtime": 0.3326, "eval_samples_per_second": 562.318, "eval_steps_per_second": 9.021, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 4608467078884878.0, "train_loss": 0.08280598743906561, "train_runtime": 623.2047, "train_samples_per_second": 270.698, "train_steps_per_second": 17.009 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4608467078884878.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }