{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.678309202194214, "learning_rate": 4.9500000000000004e-05, "loss": 0.9941, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.01183431952662722, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.05263157894736842, "eval_PERSON_recall": 0.006666666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.0689655172413793, "eval_TIME_number": 28, "eval_TIME_precision": 1.0, "eval_TIME_recall": 0.03571428571428571, "eval_loss": 0.5622514486312866, "eval_overall_accuracy": 0.8440834141610087, "eval_overall_f1": 0.010471204188481676, "eval_overall_precision": 0.05714285714285714, "eval_overall_recall": 0.005763688760806916, "eval_runtime": 0.3767, "eval_samples_per_second": 496.365, "eval_steps_per_second": 7.963, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.0868268013000488, "learning_rate": 4.9e-05, "loss": 0.4917, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.36036036036036034, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5, "eval_LOCATION_recall": 0.28169014084507044, "eval_ORGANIZATION_f1": 0.10909090909090909, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.13333333333333333, "eval_ORGANIZATION_recall": 0.09230769230769231, "eval_PERSON_f1": 0.7146974063400575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.6294416243654822, "eval_PERSON_recall": 0.8266666666666667, "eval_QUANTITY_f1": 0.125, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.12903225806451613, "eval_QUANTITY_recall": 0.12121212121212122, "eval_TIME_f1": 0.7164179104477612, "eval_TIME_number": 28, "eval_TIME_precision": 0.6153846153846154, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.34143543243408203, "eval_overall_accuracy": 0.9042192046556741, "eval_overall_f1": 0.5092989985693849, "eval_overall_precision": 0.5056818181818182, "eval_overall_recall": 0.5129682997118156, "eval_runtime": 0.3785, "eval_samples_per_second": 493.993, "eval_steps_per_second": 7.925, "step": 212 }, { "epoch": 3.0, "grad_norm": 0.8501033186912537, "learning_rate": 4.85e-05, "loss": 0.3079, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.6111111111111112, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6027397260273972, "eval_LOCATION_recall": 0.6197183098591549, "eval_ORGANIZATION_f1": 0.573170731707317, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.47474747474747475, "eval_ORGANIZATION_recall": 0.7230769230769231, "eval_PERSON_f1": 0.8173374613003096, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7630057803468208, "eval_PERSON_recall": 0.88, "eval_QUANTITY_f1": 0.5641025641025641, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.4888888888888889, "eval_QUANTITY_recall": 0.6666666666666666, "eval_TIME_f1": 0.7777777777777779, "eval_TIME_number": 28, "eval_TIME_precision": 0.8076923076923077, "eval_TIME_recall": 0.75, "eval_loss": 0.21354812383651733, "eval_overall_accuracy": 0.9277400581959263, "eval_overall_f1": 0.6972477064220184, "eval_overall_precision": 0.6394230769230769, "eval_overall_recall": 0.7665706051873199, "eval_runtime": 0.3794, "eval_samples_per_second": 492.831, "eval_steps_per_second": 7.906, "step": 318 }, { "epoch": 4.0, "grad_norm": 0.8237155079841614, "learning_rate": 4.8e-05, "loss": 0.2193, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.641025641025641, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5882352941176471, "eval_LOCATION_recall": 0.704225352112676, "eval_ORGANIZATION_f1": 0.6010928961748634, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.4661016949152542, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8395061728395062, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7816091954022989, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.5999999999999999, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5106382978723404, "eval_QUANTITY_recall": 0.7272727272727273, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17542287707328796, "eval_overall_accuracy": 0.9391367604267701, "eval_overall_f1": 0.7268170426065164, "eval_overall_precision": 0.6430155210643016, "eval_overall_recall": 0.8357348703170029, "eval_runtime": 0.3799, "eval_samples_per_second": 492.264, "eval_steps_per_second": 7.897, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.2984700202941895, "learning_rate": 4.75e-05, "loss": 0.1845, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.6708860759493671, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6091954022988506, "eval_LOCATION_recall": 0.7464788732394366, "eval_ORGANIZATION_f1": 0.6710526315789473, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5862068965517241, "eval_ORGANIZATION_recall": 0.7846153846153846, "eval_PERSON_f1": 0.8411214953271027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7894736842105263, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.5952380952380952, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.49019607843137253, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.7419354838709677, "eval_TIME_number": 28, "eval_TIME_precision": 0.6764705882352942, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.15947341918945312, "eval_overall_accuracy": 0.944713870029098, "eval_overall_f1": 0.7387387387387387, "eval_overall_precision": 0.6674418604651163, "eval_overall_recall": 0.8270893371757925, "eval_runtime": 0.3795, "eval_samples_per_second": 492.809, "eval_steps_per_second": 7.906, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.3075064420700073, "learning_rate": 4.7e-05, "loss": 0.169, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.6785714285714287, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5876288659793815, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.6829268292682926, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5656565656565656, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8509316770186336, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7965116279069767, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6153846153846154, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.4827586206896552, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.676470588235294, "eval_TIME_number": 28, "eval_TIME_precision": 0.575, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.18737278878688812, "eval_overall_accuracy": 0.933074684772066, "eval_overall_f1": 0.7404674046740467, "eval_overall_precision": 0.6459227467811158, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3823, "eval_samples_per_second": 489.095, "eval_steps_per_second": 7.846, "step": 636 }, { "epoch": 7.0, "grad_norm": 2.091857433319092, "learning_rate": 4.6500000000000005e-05, "loss": 0.1587, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.732919254658385, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6555555555555556, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6878980891719746, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5869565217391305, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8633540372670808, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8081395348837209, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5490196078431373, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 28, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15555286407470703, "eval_overall_accuracy": 0.9435014548981572, "eval_overall_f1": 0.7725540025412961, "eval_overall_precision": 0.6909090909090909, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.378, "eval_samples_per_second": 494.694, "eval_steps_per_second": 7.936, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.6778572201728821, "learning_rate": 4.600000000000001e-05, "loss": 0.1422, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7065868263473054, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6145833333333334, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.6792452830188681, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.574468085106383, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8634920634920634, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8242424242424242, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7179487179487178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6222222222222222, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7384615384615384, "eval_TIME_number": 28, "eval_TIME_precision": 0.6486486486486487, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.142758309841156, "eval_overall_accuracy": 0.9483511154219205, "eval_overall_f1": 0.7678571428571429, "eval_overall_precision": 0.6887871853546911, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3796, "eval_samples_per_second": 492.664, "eval_steps_per_second": 7.904, "step": 848 }, { "epoch": 9.0, "grad_norm": 0.740088701248169, "learning_rate": 4.55e-05, "loss": 0.1362, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.708860759493671, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6021505376344086, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8726114649681529, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8353658536585366, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6666666666666667, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5490196078431373, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13845409452915192, "eval_overall_accuracy": 0.9515033947623667, "eval_overall_f1": 0.7890625, "eval_overall_precision": 0.7197149643705463, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3794, "eval_samples_per_second": 492.924, "eval_steps_per_second": 7.908, "step": 954 }, { "epoch": 10.0, "grad_norm": 1.7449586391448975, "learning_rate": 4.5e-05, "loss": 0.1321, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7516778523489933, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.717948717948718, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7019867549668873, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6162790697674418, "eval_ORGANIZATION_recall": 0.8153846153846154, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7179487179487178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6222222222222222, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12999238073825836, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.7898936170212766, "eval_overall_precision": 0.7333333333333333, "eval_overall_recall": 0.8559077809798271, "eval_runtime": 0.3805, "eval_samples_per_second": 491.468, "eval_steps_per_second": 7.885, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.6345419883728027, "learning_rate": 4.4500000000000004e-05, "loss": 0.1217, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7096774193548387, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6111111111111112, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 28, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13535159826278687, "eval_overall_accuracy": 0.9512609117361784, "eval_overall_f1": 0.8005284015852047, "eval_overall_precision": 0.7390243902439024, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.38, "eval_samples_per_second": 492.12, "eval_steps_per_second": 7.895, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.6287707090377808, "learning_rate": 4.4000000000000006e-05, "loss": 0.1192, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7261146496815286, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6195652173913043, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13359412550926208, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8068331143232589, "eval_overall_precision": 0.7415458937198067, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3781, "eval_samples_per_second": 494.638, "eval_steps_per_second": 7.935, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.46434441208839417, "learning_rate": 4.35e-05, "loss": 0.1138, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7204968944099378, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6041666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6585365853658536, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5510204081632653, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13541372120380402, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.8005249343832022, "eval_overall_precision": 0.7349397590361446, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3812, "eval_samples_per_second": 490.62, "eval_steps_per_second": 7.871, "step": 1378 }, { "epoch": 14.0, "grad_norm": 2.5094404220581055, "learning_rate": 4.3e-05, "loss": 0.1103, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7236842105263158, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.632183908045977, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.675, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.574468085106383, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1337423026561737, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8064085447263017, "eval_overall_precision": 0.7512437810945274, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3799, "eval_samples_per_second": 492.18, "eval_steps_per_second": 7.896, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.8557437658309937, "learning_rate": 4.25e-05, "loss": 0.1038, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7272727272727273, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6292134831460674, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.675, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.574468085106383, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1362387090921402, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8031704095112285, "eval_overall_precision": 0.7414634146341463, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3807, "eval_samples_per_second": 491.261, "eval_steps_per_second": 7.881, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.1418652534484863, "learning_rate": 4.2e-05, "loss": 0.1016, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6585365853658536, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5510204081632653, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1373499035835266, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8042609853528628, "eval_overall_precision": 0.7475247524752475, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.3807, "eval_samples_per_second": 491.2, "eval_steps_per_second": 7.88, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.8007000684738159, "learning_rate": 4.15e-05, "loss": 0.1008, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1264466941356659, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8123324396782842, "eval_overall_precision": 0.7593984962406015, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3813, "eval_samples_per_second": 490.475, "eval_steps_per_second": 7.869, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.6803272366523743, "learning_rate": 4.1e-05, "loss": 0.0961, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7044025157232704, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5957446808510638, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14231978356838226, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.7936925098554534, "eval_overall_precision": 0.7294685990338164, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.38, "eval_samples_per_second": 492.088, "eval_steps_per_second": 7.894, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.7480773329734802, "learning_rate": 4.05e-05, "loss": 0.0927, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.7552447552447553, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.7605633802816901, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12808914482593536, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8113207547169812, "eval_overall_precision": 0.7620253164556962, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3783, "eval_samples_per_second": 494.38, "eval_steps_per_second": 7.931, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.7538065314292908, "learning_rate": 4e-05, "loss": 0.0896, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7741935483870968, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7142857142857143, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9090909090909091, "eval_TIME_number": 28, "eval_TIME_precision": 0.9259259259259259, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13772721588611603, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8170894526034712, "eval_overall_precision": 0.7611940298507462, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3854, "eval_samples_per_second": 485.188, "eval_steps_per_second": 7.784, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.0004348754882812, "learning_rate": 3.9500000000000005e-05, "loss": 0.0881, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7361963190184049, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6122448979591837, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14643645286560059, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.8083989501312335, "eval_overall_precision": 0.7421686746987952, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3785, "eval_samples_per_second": 494.113, "eval_steps_per_second": 7.927, "step": 2226 }, { "epoch": 22.0, "grad_norm": 1.1350208520889282, "learning_rate": 3.9000000000000006e-05, "loss": 0.0886, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7317073170731707, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6060606060606061, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14820407330989838, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8125819134993448, "eval_overall_precision": 0.7451923076923077, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3842, "eval_samples_per_second": 486.763, "eval_steps_per_second": 7.809, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.8477388620376587, "learning_rate": 3.85e-05, "loss": 0.0854, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13370120525360107, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8187919463087249, "eval_overall_precision": 0.7663316582914573, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3801, "eval_samples_per_second": 491.988, "eval_steps_per_second": 7.893, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.1856006383895874, "learning_rate": 3.8e-05, "loss": 0.0826, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.725, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6105263157894737, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15471965074539185, "eval_overall_accuracy": 0.9532007759456838, "eval_overall_f1": 0.8031704095112285, "eval_overall_precision": 0.7414634146341463, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3802, "eval_samples_per_second": 491.892, "eval_steps_per_second": 7.891, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.49151602387428284, "learning_rate": 3.7500000000000003e-05, "loss": 0.0807, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7515923566878981, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6413043478260869, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8831168831168831, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8607594936708861, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14267697930335999, "eval_overall_accuracy": 0.9561105722599418, "eval_overall_f1": 0.809078771695594, "eval_overall_precision": 0.753731343283582, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3888, "eval_samples_per_second": 481.006, "eval_steps_per_second": 7.717, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.8003281354904175, "learning_rate": 3.7e-05, "loss": 0.0784, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7651006711409396, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6785714285714286, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8737864077669903, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8490566037735849, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.675, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.574468085106383, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15734340250492096, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8085106382978724, "eval_overall_precision": 0.7506172839506173, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.381, "eval_samples_per_second": 490.758, "eval_steps_per_second": 7.873, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.7769756317138672, "learning_rate": 3.65e-05, "loss": 0.0752, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.7466666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7088607594936709, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8802588996763754, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8553459119496856, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6419753086419753, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5416666666666666, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15696412324905396, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.7973333333333333, "eval_overall_precision": 0.7419354838709677, "eval_overall_recall": 0.861671469740634, "eval_runtime": 0.3811, "eval_samples_per_second": 490.643, "eval_steps_per_second": 7.871, "step": 2862 }, { "epoch": 28.0, "grad_norm": 1.2662298679351807, "learning_rate": 3.6e-05, "loss": 0.0747, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.7346938775510203, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7105263157894737, "eval_LOCATION_recall": 0.7605633802816901, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8867313915857605, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8616352201257862, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15037189424037933, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8113207547169812, "eval_overall_precision": 0.7620253164556962, "eval_overall_recall": 0.8674351585014409, "eval_runtime": 0.3804, "eval_samples_per_second": 491.554, "eval_steps_per_second": 7.886, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.4553508162498474, "learning_rate": 3.55e-05, "loss": 0.073, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.7870967741935485, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7261904761904762, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7361963190184049, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6122448979591837, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1491299420595169, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8215223097112859, "eval_overall_precision": 0.7542168674698795, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3799, "eval_samples_per_second": 492.196, "eval_steps_per_second": 7.896, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.8037567138671875, "learning_rate": 3.5e-05, "loss": 0.0722, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7393939393939394, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.61, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15461239218711853, "eval_overall_accuracy": 0.9539282250242483, "eval_overall_f1": 0.8178243774574051, "eval_overall_precision": 0.75, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3813, "eval_samples_per_second": 490.39, "eval_steps_per_second": 7.867, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.863256573677063, "learning_rate": 3.45e-05, "loss": 0.0691, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.9285714285714286, "eval_TIME_number": 28, "eval_TIME_precision": 0.9285714285714286, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1460384577512741, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.381, "eval_samples_per_second": 490.806, "eval_steps_per_second": 7.874, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.5189836025238037, "learning_rate": 3.4000000000000007e-05, "loss": 0.0677, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.725, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6105263157894737, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1576639711856842, "eval_overall_accuracy": 0.9546556741028128, "eval_overall_f1": 0.8110236220472441, "eval_overall_precision": 0.744578313253012, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3784, "eval_samples_per_second": 494.206, "eval_steps_per_second": 7.928, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.9570697546005249, "learning_rate": 3.35e-05, "loss": 0.0656, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7450980392156863, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6951219512195121, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7295597484276729, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6170212765957447, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8524590163934426, "eval_TIME_number": 28, "eval_TIME_precision": 0.7878787878787878, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.15803979337215424, "eval_overall_accuracy": 0.9544131910766246, "eval_overall_f1": 0.8078947368421052, "eval_overall_precision": 0.7433414043583535, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3813, "eval_samples_per_second": 490.461, "eval_steps_per_second": 7.868, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.5982742309570312, "learning_rate": 3.3e-05, "loss": 0.0665, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7945205479452054, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7160493827160493, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14798475801944733, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8178137651821863, "eval_overall_precision": 0.7690355329949239, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3819, "eval_samples_per_second": 489.71, "eval_steps_per_second": 7.856, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.8073542714118958, "learning_rate": 3.2500000000000004e-05, "loss": 0.063, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7080745341614907, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.59375, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16065409779548645, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8005249343832022, "eval_overall_precision": 0.7349397590361446, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3816, "eval_samples_per_second": 490.048, "eval_steps_per_second": 7.862, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.0155664682388306, "learning_rate": 3.2000000000000005e-05, "loss": 0.0591, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7435897435897436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6373626373626373, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16883772611618042, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8121693121693121, "eval_overall_precision": 0.7506112469437652, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3804, "eval_samples_per_second": 491.571, "eval_steps_per_second": 7.886, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.546472430229187, "learning_rate": 3.15e-05, "loss": 0.0601, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7195121951219511, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5959595959595959, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6835443037974683, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5869565217391305, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1751433163881302, "eval_overall_accuracy": 0.9515033947623667, "eval_overall_f1": 0.8067444876783398, "eval_overall_precision": 0.7334905660377359, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3807, "eval_samples_per_second": 491.234, "eval_steps_per_second": 7.881, "step": 3922 }, { "epoch": 38.0, "grad_norm": 1.2387559413909912, "learning_rate": 3.1e-05, "loss": 0.0624, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.675, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.574468085106383, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8727272727272727, "eval_TIME_number": 28, "eval_TIME_precision": 0.8888888888888888, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16471463441848755, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8134228187919462, "eval_overall_precision": 0.7613065326633166, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3803, "eval_samples_per_second": 491.693, "eval_steps_per_second": 7.888, "step": 4028 }, { "epoch": 39.0, "grad_norm": 1.1353509426116943, "learning_rate": 3.05e-05, "loss": 0.0609, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15616856515407562, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.821954484605087, "eval_overall_precision": 0.7675, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3789, "eval_samples_per_second": 493.535, "eval_steps_per_second": 7.918, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.9101806282997131, "learning_rate": 3e-05, "loss": 0.057, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7388535031847134, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6304347826086957, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1563103348016739, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8122503328894807, "eval_overall_precision": 0.754950495049505, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3832, "eval_samples_per_second": 488.013, "eval_steps_per_second": 7.829, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.3714537024497986, "learning_rate": 2.95e-05, "loss": 0.0588, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7341772151898733, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6236559139784946, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16024786233901978, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8111702127659575, "eval_overall_precision": 0.7530864197530864, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3803, "eval_samples_per_second": 491.781, "eval_steps_per_second": 7.89, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.28185874223709106, "learning_rate": 2.9e-05, "loss": 0.0537, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6179775280898876, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8253968253968255, "eval_TIME_number": 28, "eval_TIME_precision": 0.7428571428571429, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16531838476657867, "eval_overall_accuracy": 0.953443258971872, "eval_overall_f1": 0.8015873015873015, "eval_overall_precision": 0.7408312958435208, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3794, "eval_samples_per_second": 492.881, "eval_steps_per_second": 7.907, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.7425450682640076, "learning_rate": 2.8499999999999998e-05, "loss": 0.0565, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6265060240963856, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.52, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.7878787878787878, "eval_TIME_number": 28, "eval_TIME_precision": 0.6842105263157895, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17831364274024963, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.7947712418300654, "eval_overall_precision": 0.7272727272727273, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3828, "eval_samples_per_second": 488.483, "eval_steps_per_second": 7.837, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.7398239374160767, "learning_rate": 2.8000000000000003e-05, "loss": 0.0564, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7662337662337663, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6629213483146067, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1617172211408615, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8155080213903744, "eval_overall_precision": 0.7605985037406484, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3803, "eval_samples_per_second": 491.678, "eval_steps_per_second": 7.888, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.9621509313583374, "learning_rate": 2.7500000000000004e-05, "loss": 0.053, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7891156462585034, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7073170731707317, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1658838987350464, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8150134048257373, "eval_overall_precision": 0.7619047619047619, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.382, "eval_samples_per_second": 489.542, "eval_steps_per_second": 7.854, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.8231198787689209, "learning_rate": 2.7000000000000002e-05, "loss": 0.0503, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8817891373801918, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8466257668711656, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16653133928775787, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.824631860776439, "eval_overall_precision": 0.77, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.38, "eval_samples_per_second": 492.088, "eval_steps_per_second": 7.894, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.7595716118812561, "learning_rate": 2.6500000000000004e-05, "loss": 0.0513, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16581283509731293, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3809, "eval_samples_per_second": 490.938, "eval_steps_per_second": 7.876, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.855539858341217, "learning_rate": 2.6000000000000002e-05, "loss": 0.0501, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7581699346405228, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6590909090909091, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1663612574338913, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8122503328894807, "eval_overall_precision": 0.754950495049505, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3811, "eval_samples_per_second": 490.649, "eval_steps_per_second": 7.871, "step": 5088 }, { "epoch": 49.0, "grad_norm": 1.5128129720687866, "learning_rate": 2.5500000000000003e-05, "loss": 0.0497, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7785234899328859, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6904761904761905, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16162331402301788, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8197596795727637, "eval_overall_precision": 0.763681592039801, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3826, "eval_samples_per_second": 488.697, "eval_steps_per_second": 7.84, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.2246452569961548, "learning_rate": 2.5e-05, "loss": 0.0478, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8681672025723473, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8385093167701864, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16639897227287292, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.809078771695594, "eval_overall_precision": 0.753731343283582, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3797, "eval_samples_per_second": 492.491, "eval_steps_per_second": 7.901, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.46794039011001587, "learning_rate": 2.45e-05, "loss": 0.0481, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1614912897348404, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8164893617021276, "eval_overall_precision": 0.7580246913580246, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3874, "eval_samples_per_second": 482.673, "eval_steps_per_second": 7.743, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.9891065359115601, "learning_rate": 2.4e-05, "loss": 0.0467, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5625, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8387096774193549, "eval_TIME_number": 28, "eval_TIME_precision": 0.7647058823529411, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17710401117801666, "eval_overall_accuracy": 0.954898157129001, "eval_overall_f1": 0.8078947368421052, "eval_overall_precision": 0.7433414043583535, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3803, "eval_samples_per_second": 491.68, "eval_steps_per_second": 7.888, "step": 5512 }, { "epoch": 53.0, "grad_norm": 1.105144739151001, "learning_rate": 2.35e-05, "loss": 0.0454, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17059719562530518, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8192771084337349, "eval_overall_precision": 0.765, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3808, "eval_samples_per_second": 491.088, "eval_steps_per_second": 7.878, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.8647188544273376, "learning_rate": 2.3000000000000003e-05, "loss": 0.0423, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7972972972972974, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7108433734939759, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8653846153846153, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8333333333333334, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17431387305259705, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8161073825503355, "eval_overall_precision": 0.7638190954773869, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.381, "eval_samples_per_second": 490.855, "eval_steps_per_second": 7.875, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.8007002472877502, "learning_rate": 2.25e-05, "loss": 0.0454, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7837837837837838, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6987951807228916, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.172898069024086, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8225806451612904, "eval_overall_precision": 0.7707808564231738, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.38, "eval_samples_per_second": 492.135, "eval_steps_per_second": 7.895, "step": 5830 }, { "epoch": 56.0, "grad_norm": 1.071050763130188, "learning_rate": 2.2000000000000003e-05, "loss": 0.0445, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.802721088435374, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7195121951219512, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16954554617404938, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.825268817204301, "eval_overall_precision": 0.7732997481108312, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3811, "eval_samples_per_second": 490.727, "eval_steps_per_second": 7.873, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.8882637619972229, "learning_rate": 2.15e-05, "loss": 0.0426, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7887323943661972, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7272727272727273, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18545663356781006, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8265582655826558, "eval_overall_precision": 0.7800511508951407, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3807, "eval_samples_per_second": 491.172, "eval_steps_per_second": 7.88, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.8679073452949524, "learning_rate": 2.1e-05, "loss": 0.0423, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7916666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7215189873417721, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8717948717948718, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8395061728395061, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17360354959964752, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8233695652173914, "eval_overall_precision": 0.7789203084832905, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.381, "eval_samples_per_second": 490.858, "eval_steps_per_second": 7.875, "step": 6148 }, { "epoch": 59.0, "grad_norm": 2.275029420852661, "learning_rate": 2.05e-05, "loss": 0.0431, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7972972972972974, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7108433734939759, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1791093796491623, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3794, "eval_samples_per_second": 492.887, "eval_steps_per_second": 7.907, "step": 6254 }, { "epoch": 60.0, "grad_norm": 2.5058839321136475, "learning_rate": 2e-05, "loss": 0.0428, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7792207792207791, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6741573033707865, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8782051282051282, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.845679012345679, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17754900455474854, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.823529411764706, "eval_overall_precision": 0.7680798004987531, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3808, "eval_samples_per_second": 491.029, "eval_steps_per_second": 7.877, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.7865079045295715, "learning_rate": 1.9500000000000003e-05, "loss": 0.0413, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7891156462585034, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7073170731707317, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16769103705883026, "eval_overall_accuracy": 0.9602327837051406, "eval_overall_f1": 0.8243243243243243, "eval_overall_precision": 0.7760814249363868, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3783, "eval_samples_per_second": 494.306, "eval_steps_per_second": 7.93, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.5289219617843628, "learning_rate": 1.9e-05, "loss": 0.0398, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7354838709677419, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6333333333333333, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8745980707395499, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84472049689441, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18425512313842773, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8100929614873836, "eval_overall_precision": 0.7512315270935961, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.381, "eval_samples_per_second": 490.826, "eval_steps_per_second": 7.874, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.5517676472663879, "learning_rate": 1.85e-05, "loss": 0.0375, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.76, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7329192546583851, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6145833333333334, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18431755900382996, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.8068783068783069, "eval_overall_precision": 0.7457212713936431, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3828, "eval_samples_per_second": 488.495, "eval_steps_per_second": 7.837, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.43984198570251465, "learning_rate": 1.8e-05, "loss": 0.0393, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7945205479452054, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7160493827160493, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1756104677915573, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.827027027027027, "eval_overall_precision": 0.7786259541984732, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3797, "eval_samples_per_second": 492.431, "eval_steps_per_second": 7.9, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.6901776194572449, "learning_rate": 1.75e-05, "loss": 0.0381, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7397260273972603, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18173794448375702, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8203753351206434, "eval_overall_precision": 0.7669172932330827, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3821, "eval_samples_per_second": 489.382, "eval_steps_per_second": 7.851, "step": 6890 }, { "epoch": 66.0, "grad_norm": 1.4130526781082153, "learning_rate": 1.7000000000000003e-05, "loss": 0.0391, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7702702702702703, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7402597402597403, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1838272213935852, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8149134487350199, "eval_overall_precision": 0.7574257425742574, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3826, "eval_samples_per_second": 488.807, "eval_steps_per_second": 7.842, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.6909719109535217, "learning_rate": 1.65e-05, "loss": 0.0378, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7402597402597403, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6867469879518072, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7307692307692307, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6263736263736264, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.19103722274303436, "eval_overall_accuracy": 0.9551406401551892, "eval_overall_f1": 0.8068783068783069, "eval_overall_precision": 0.7457212713936431, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3805, "eval_samples_per_second": 491.5, "eval_steps_per_second": 7.885, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.3753189742565155, "learning_rate": 1.6000000000000003e-05, "loss": 0.0385, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7919463087248322, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7023809523809523, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.870967741935484, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.84375, "eval_PERSON_recall": 0.9, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18312758207321167, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3806, "eval_samples_per_second": 491.353, "eval_steps_per_second": 7.883, "step": 7208 }, { "epoch": 69.0, "grad_norm": 1.2078567743301392, "learning_rate": 1.55e-05, "loss": 0.0382, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7515923566878981, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6413043478260869, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17568355798721313, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8186666666666667, "eval_overall_precision": 0.7617866004962779, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.38, "eval_samples_per_second": 492.048, "eval_steps_per_second": 7.894, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.411945104598999, "learning_rate": 1.5e-05, "loss": 0.0363, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7972972972972974, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7108433734939759, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17883449792861938, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8274932614555257, "eval_overall_precision": 0.7772151898734178, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3804, "eval_samples_per_second": 491.549, "eval_steps_per_second": 7.886, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.6801556348800659, "learning_rate": 1.45e-05, "loss": 0.0351, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7662337662337663, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6629213483146067, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8846153846153846, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8518518518518519, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18632389605045319, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8202396804260986, "eval_overall_precision": 0.7623762376237624, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3814, "eval_samples_per_second": 490.305, "eval_steps_per_second": 7.866, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.6433190703392029, "learning_rate": 1.4000000000000001e-05, "loss": 0.0353, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7341772151898733, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6236559139784946, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8838709677419355, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85625, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18783344328403473, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8116710875331565, "eval_overall_precision": 0.7518427518427518, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3807, "eval_samples_per_second": 491.151, "eval_steps_per_second": 7.879, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.3200623095035553, "learning_rate": 1.3500000000000001e-05, "loss": 0.0343, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7581699346405228, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6590909090909091, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.17813065648078918, "eval_overall_accuracy": 0.9575654704170709, "eval_overall_f1": 0.8198924731182795, "eval_overall_precision": 0.7682619647355163, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.38, "eval_samples_per_second": 492.144, "eval_steps_per_second": 7.895, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.39253032207489014, "learning_rate": 1.3000000000000001e-05, "loss": 0.0338, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7891156462585034, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7073170731707317, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18210819363594055, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.830393487109905, "eval_overall_precision": 0.7846153846153846, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3797, "eval_samples_per_second": 492.508, "eval_steps_per_second": 7.901, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.9440187811851501, "learning_rate": 1.25e-05, "loss": 0.0338, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7837837837837838, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6987951807228916, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18501493334770203, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.82907133243607, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3803, "eval_samples_per_second": 491.709, "eval_steps_per_second": 7.888, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.030535509809851646, "learning_rate": 1.2e-05, "loss": 0.0348, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8774193548387097, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.85, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18246251344680786, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8172043010752689, "eval_overall_precision": 0.7657430730478589, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3836, "eval_samples_per_second": 487.539, "eval_steps_per_second": 7.821, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.3823874294757843, "learning_rate": 1.1500000000000002e-05, "loss": 0.0349, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7916666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7215189873417721, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8810289389067525, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8509316770186336, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1836749166250229, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8288043478260869, "eval_overall_precision": 0.7840616966580977, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3828, "eval_samples_per_second": 488.496, "eval_steps_per_second": 7.837, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.7046309113502502, "learning_rate": 1.1000000000000001e-05, "loss": 0.0332, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18720394372940063, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8313090418353577, "eval_overall_precision": 0.7817258883248731, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3838, "eval_samples_per_second": 487.247, "eval_steps_per_second": 7.817, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.7197487354278564, "learning_rate": 1.05e-05, "loss": 0.0348, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.181439608335495, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.830188679245283, "eval_overall_precision": 0.779746835443038, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3799, "eval_samples_per_second": 492.17, "eval_steps_per_second": 7.896, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.49554863572120667, "learning_rate": 1e-05, "loss": 0.0327, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7814569536423841, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.686046511627907, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18670083582401276, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8322147651006712, "eval_overall_precision": 0.7788944723618091, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3815, "eval_samples_per_second": 490.142, "eval_steps_per_second": 7.863, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.4919203817844391, "learning_rate": 9.5e-06, "loss": 0.0304, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7891156462585034, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7073170731707317, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.18983295559883118, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8313090418353577, "eval_overall_precision": 0.7817258883248731, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.38, "eval_samples_per_second": 492.144, "eval_steps_per_second": 7.895, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.3511189222335815, "learning_rate": 9e-06, "loss": 0.0311, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7763157894736842, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6781609195402298, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19013887643814087, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8284182305630027, "eval_overall_precision": 0.7744360902255639, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3801, "eval_samples_per_second": 491.997, "eval_steps_per_second": 7.893, "step": 8692 }, { "epoch": 83.0, "grad_norm": 1.181095838546753, "learning_rate": 8.500000000000002e-06, "loss": 0.0311, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7651006711409397, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7307692307692307, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.18673187494277954, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8176943699731903, "eval_overall_precision": 0.7644110275689223, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3803, "eval_samples_per_second": 491.728, "eval_steps_per_second": 7.889, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.2343386560678482, "learning_rate": 8.000000000000001e-06, "loss": 0.0311, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.7682119205298014, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.725, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19123651087284088, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8247978436657682, "eval_overall_precision": 0.7746835443037975, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3809, "eval_samples_per_second": 490.888, "eval_steps_per_second": 7.875, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.7187972664833069, "learning_rate": 7.5e-06, "loss": 0.0316, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7651006711409396, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6785714285714286, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19598372280597687, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.82907133243607, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3804, "eval_samples_per_second": 491.562, "eval_steps_per_second": 7.886, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.7457745671272278, "learning_rate": 7.000000000000001e-06, "loss": 0.0302, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7105263157894738, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.627906976744186, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19160479307174683, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8257372654155496, "eval_overall_precision": 0.7719298245614035, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3793, "eval_samples_per_second": 493.05, "eval_steps_per_second": 7.91, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.7893774509429932, "learning_rate": 6.5000000000000004e-06, "loss": 0.0302, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19260451197624207, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8310991957104558, "eval_overall_precision": 0.7769423558897243, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3814, "eval_samples_per_second": 490.309, "eval_steps_per_second": 7.866, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.9674557447433472, "learning_rate": 6e-06, "loss": 0.0301, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19156460464000702, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.38, "eval_samples_per_second": 492.071, "eval_steps_per_second": 7.894, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.4081524610519409, "learning_rate": 5.500000000000001e-06, "loss": 0.0291, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8932038834951457, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8679245283018868, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6923076923076923, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8666666666666666, "eval_TIME_number": 28, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1988055408000946, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.822429906542056, "eval_overall_precision": 0.7661691542288557, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3814, "eval_samples_per_second": 490.312, "eval_steps_per_second": 7.866, "step": 9434 }, { "epoch": 90.0, "grad_norm": 1.2055195569992065, "learning_rate": 5e-06, "loss": 0.029, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.7972972972972973, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19222281873226166, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3817, "eval_samples_per_second": 489.931, "eval_steps_per_second": 7.86, "step": 9540 }, { "epoch": 91.0, "grad_norm": 1.7582001686096191, "learning_rate": 4.5e-06, "loss": 0.0281, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.896551724137931, "eval_TIME_number": 28, "eval_TIME_precision": 0.8666666666666667, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19376523792743683, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.381, "eval_samples_per_second": 490.839, "eval_steps_per_second": 7.874, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.382251501083374, "learning_rate": 4.000000000000001e-06, "loss": 0.0293, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.7549668874172185, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7125, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19469353556632996, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3841, "eval_samples_per_second": 486.911, "eval_steps_per_second": 7.811, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.3737156391143799, "learning_rate": 3.5000000000000004e-06, "loss": 0.0279, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7712418300653594, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7195121951219512, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1938970983028412, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8213333333333332, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3809, "eval_samples_per_second": 490.922, "eval_steps_per_second": 7.876, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.39239442348480225, "learning_rate": 3e-06, "loss": 0.0284, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7581699346405228, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7073170731707317, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19448162615299225, "eval_overall_accuracy": 0.9573229873908826, "eval_overall_f1": 0.8181818181818181, "eval_overall_precision": 0.7630922693266833, "eval_overall_recall": 0.8818443804034583, "eval_runtime": 0.3812, "eval_samples_per_second": 490.524, "eval_steps_per_second": 7.869, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.2501358091831207, "learning_rate": 2.5e-06, "loss": 0.0277, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19271968305110931, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8263795423956932, "eval_overall_precision": 0.7752525252525253, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.38, "eval_samples_per_second": 492.071, "eval_steps_per_second": 7.894, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.3346474766731262, "learning_rate": 2.0000000000000003e-06, "loss": 0.0287, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7919463087248323, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19360853731632233, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.82907133243607, "eval_overall_precision": 0.7777777777777778, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3831, "eval_samples_per_second": 488.178, "eval_steps_per_second": 7.832, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.5980328917503357, "learning_rate": 1.5e-06, "loss": 0.0295, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1938299536705017, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.381, "eval_samples_per_second": 490.819, "eval_steps_per_second": 7.874, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.5382476449012756, "learning_rate": 1.0000000000000002e-06, "loss": 0.028, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.19374345242977142, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3823, "eval_samples_per_second": 489.131, "eval_steps_per_second": 7.847, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.7957453727722168, "learning_rate": 5.000000000000001e-07, "loss": 0.0288, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1937512904405594, "eval_overall_accuracy": 0.9580504364694471, "eval_overall_f1": 0.8268456375838926, "eval_overall_precision": 0.7738693467336684, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3822, "eval_samples_per_second": 489.325, "eval_steps_per_second": 7.85, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.36327624320983887, "learning_rate": 0.0, "loss": 0.0272, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7297297297297297, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6585365853658537, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1937185674905777, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8279569892473119, "eval_overall_precision": 0.7758186397984886, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3796, "eval_samples_per_second": 492.654, "eval_steps_per_second": 7.904, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5123217774191952.0, "train_loss": 0.07702873169251208, "train_runtime": 615.3274, "train_samples_per_second": 274.326, "train_steps_per_second": 17.227 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5123217774191952.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }