nerugm-pt-pl20-3 / trainer_state.json
apwic's picture
End of training
15de95b verified
raw
history blame contribute delete
No virus
145 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.678309202194214,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9941,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.01183431952662722,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.05263157894736842,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0689655172413793,
"eval_TIME_number": 28,
"eval_TIME_precision": 1.0,
"eval_TIME_recall": 0.03571428571428571,
"eval_loss": 0.5622514486312866,
"eval_overall_accuracy": 0.8440834141610087,
"eval_overall_f1": 0.010471204188481676,
"eval_overall_precision": 0.05714285714285714,
"eval_overall_recall": 0.005763688760806916,
"eval_runtime": 0.3767,
"eval_samples_per_second": 496.365,
"eval_steps_per_second": 7.963,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.0868268013000488,
"learning_rate": 4.9e-05,
"loss": 0.4917,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.36036036036036034,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.28169014084507044,
"eval_ORGANIZATION_f1": 0.10909090909090909,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.13333333333333333,
"eval_ORGANIZATION_recall": 0.09230769230769231,
"eval_PERSON_f1": 0.7146974063400575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.6294416243654822,
"eval_PERSON_recall": 0.8266666666666667,
"eval_QUANTITY_f1": 0.125,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.12903225806451613,
"eval_QUANTITY_recall": 0.12121212121212122,
"eval_TIME_f1": 0.7164179104477612,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6153846153846154,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.34143543243408203,
"eval_overall_accuracy": 0.9042192046556741,
"eval_overall_f1": 0.5092989985693849,
"eval_overall_precision": 0.5056818181818182,
"eval_overall_recall": 0.5129682997118156,
"eval_runtime": 0.3785,
"eval_samples_per_second": 493.993,
"eval_steps_per_second": 7.925,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 0.8501033186912537,
"learning_rate": 4.85e-05,
"loss": 0.3079,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6111111111111112,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6027397260273972,
"eval_LOCATION_recall": 0.6197183098591549,
"eval_ORGANIZATION_f1": 0.573170731707317,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.47474747474747475,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8173374613003096,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7630057803468208,
"eval_PERSON_recall": 0.88,
"eval_QUANTITY_f1": 0.5641025641025641,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.4888888888888889,
"eval_QUANTITY_recall": 0.6666666666666666,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.75,
"eval_loss": 0.21354812383651733,
"eval_overall_accuracy": 0.9277400581959263,
"eval_overall_f1": 0.6972477064220184,
"eval_overall_precision": 0.6394230769230769,
"eval_overall_recall": 0.7665706051873199,
"eval_runtime": 0.3794,
"eval_samples_per_second": 492.831,
"eval_steps_per_second": 7.906,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 0.8237155079841614,
"learning_rate": 4.8e-05,
"loss": 0.2193,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.641025641025641,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5882352941176471,
"eval_LOCATION_recall": 0.704225352112676,
"eval_ORGANIZATION_f1": 0.6010928961748634,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4661016949152542,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8395061728395062,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7816091954022989,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5999999999999999,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5106382978723404,
"eval_QUANTITY_recall": 0.7272727272727273,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17542287707328796,
"eval_overall_accuracy": 0.9391367604267701,
"eval_overall_f1": 0.7268170426065164,
"eval_overall_precision": 0.6430155210643016,
"eval_overall_recall": 0.8357348703170029,
"eval_runtime": 0.3799,
"eval_samples_per_second": 492.264,
"eval_steps_per_second": 7.897,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.2984700202941895,
"learning_rate": 4.75e-05,
"loss": 0.1845,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.6708860759493671,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6091954022988506,
"eval_LOCATION_recall": 0.7464788732394366,
"eval_ORGANIZATION_f1": 0.6710526315789473,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5862068965517241,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8411214953271027,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7894736842105263,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.5952380952380952,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.49019607843137253,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.7419354838709677,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6764705882352942,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.15947341918945312,
"eval_overall_accuracy": 0.944713870029098,
"eval_overall_f1": 0.7387387387387387,
"eval_overall_precision": 0.6674418604651163,
"eval_overall_recall": 0.8270893371757925,
"eval_runtime": 0.3795,
"eval_samples_per_second": 492.809,
"eval_steps_per_second": 7.906,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.3075064420700073,
"learning_rate": 4.7e-05,
"loss": 0.169,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.6785714285714287,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5876288659793815,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.6829268292682926,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5656565656565656,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8509316770186336,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7965116279069767,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6153846153846154,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.4827586206896552,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.676470588235294,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.575,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.18737278878688812,
"eval_overall_accuracy": 0.933074684772066,
"eval_overall_f1": 0.7404674046740467,
"eval_overall_precision": 0.6459227467811158,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3823,
"eval_samples_per_second": 489.095,
"eval_steps_per_second": 7.846,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 2.091857433319092,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1587,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.732919254658385,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6555555555555556,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6878980891719746,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5869565217391305,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8633540372670808,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8081395348837209,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5490196078431373,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15555286407470703,
"eval_overall_accuracy": 0.9435014548981572,
"eval_overall_f1": 0.7725540025412961,
"eval_overall_precision": 0.6909090909090909,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.378,
"eval_samples_per_second": 494.694,
"eval_steps_per_second": 7.936,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.6778572201728821,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1422,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7065868263473054,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6145833333333334,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.6792452830188681,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.574468085106383,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8634920634920634,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8242424242424242,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7179487179487178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6222222222222222,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7384615384615384,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6486486486486487,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.142758309841156,
"eval_overall_accuracy": 0.9483511154219205,
"eval_overall_f1": 0.7678571428571429,
"eval_overall_precision": 0.6887871853546911,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3796,
"eval_samples_per_second": 492.664,
"eval_steps_per_second": 7.904,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.740088701248169,
"learning_rate": 4.55e-05,
"loss": 0.1362,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7549668874172185,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5490196078431373,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13845409452915192,
"eval_overall_accuracy": 0.9515033947623667,
"eval_overall_f1": 0.7890625,
"eval_overall_precision": 0.7197149643705463,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3794,
"eval_samples_per_second": 492.924,
"eval_steps_per_second": 7.908,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.7449586391448975,
"learning_rate": 4.5e-05,
"loss": 0.1321,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7516778523489933,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.717948717948718,
"eval_LOCATION_recall": 0.7887323943661971,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7179487179487178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6222222222222222,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12999238073825836,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.7898936170212766,
"eval_overall_precision": 0.7333333333333333,
"eval_overall_recall": 0.8559077809798271,
"eval_runtime": 0.3805,
"eval_samples_per_second": 491.468,
"eval_steps_per_second": 7.885,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.6345419883728027,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1217,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13535159826278687,
"eval_overall_accuracy": 0.9512609117361784,
"eval_overall_f1": 0.8005284015852047,
"eval_overall_precision": 0.7390243902439024,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.12,
"eval_steps_per_second": 7.895,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.6287707090377808,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1192,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7643312101910827,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7261146496815286,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6195652173913043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13359412550926208,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8068331143232589,
"eval_overall_precision": 0.7415458937198067,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.638,
"eval_steps_per_second": 7.935,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.46434441208839417,
"learning_rate": 4.35e-05,
"loss": 0.1138,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7204968944099378,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6041666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6585365853658536,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5510204081632653,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13541372120380402,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.8005249343832022,
"eval_overall_precision": 0.7349397590361446,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3812,
"eval_samples_per_second": 490.62,
"eval_steps_per_second": 7.871,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 2.5094404220581055,
"learning_rate": 4.3e-05,
"loss": 0.1103,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.675,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.574468085106383,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1337423026561737,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8064085447263017,
"eval_overall_precision": 0.7512437810945274,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3799,
"eval_samples_per_second": 492.18,
"eval_steps_per_second": 7.896,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.8557437658309937,
"learning_rate": 4.25e-05,
"loss": 0.1038,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7272727272727273,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6292134831460674,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.675,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.574468085106383,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1362387090921402,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.8031704095112285,
"eval_overall_precision": 0.7414634146341463,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.261,
"eval_steps_per_second": 7.881,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.1418652534484863,
"learning_rate": 4.2e-05,
"loss": 0.1016,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6585365853658536,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5510204081632653,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1373499035835266,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8042609853528628,
"eval_overall_precision": 0.7475247524752475,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.2,
"eval_steps_per_second": 7.88,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.8007000684738159,
"learning_rate": 4.15e-05,
"loss": 0.1008,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1264466941356659,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8123324396782842,
"eval_overall_precision": 0.7593984962406015,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.475,
"eval_steps_per_second": 7.869,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.6803272366523743,
"learning_rate": 4.1e-05,
"loss": 0.0961,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7549668874172185,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7044025157232704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5957446808510638,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14231978356838226,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.7936925098554534,
"eval_overall_precision": 0.7294685990338164,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.088,
"eval_steps_per_second": 7.894,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.7480773329734802,
"learning_rate": 4.05e-05,
"loss": 0.0927,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7552447552447553,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.7605633802816901,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12808914482593536,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8113207547169812,
"eval_overall_precision": 0.7620253164556962,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3783,
"eval_samples_per_second": 494.38,
"eval_steps_per_second": 7.931,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.7538065314292908,
"learning_rate": 4e-05,
"loss": 0.0896,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7741935483870968,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13772721588611603,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8170894526034712,
"eval_overall_precision": 0.7611940298507462,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3854,
"eval_samples_per_second": 485.188,
"eval_steps_per_second": 7.784,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.0004348754882812,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0881,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7361963190184049,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6122448979591837,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14643645286560059,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.8083989501312335,
"eval_overall_precision": 0.7421686746987952,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3785,
"eval_samples_per_second": 494.113,
"eval_steps_per_second": 7.927,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.1350208520889282,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0886,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7317073170731707,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6060606060606061,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14820407330989838,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8125819134993448,
"eval_overall_precision": 0.7451923076923077,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3842,
"eval_samples_per_second": 486.763,
"eval_steps_per_second": 7.809,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.8477388620376587,
"learning_rate": 3.85e-05,
"loss": 0.0854,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13370120525360107,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7663316582914573,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3801,
"eval_samples_per_second": 491.988,
"eval_steps_per_second": 7.893,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.1856006383895874,
"learning_rate": 3.8e-05,
"loss": 0.0826,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.725,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6105263157894737,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15471965074539185,
"eval_overall_accuracy": 0.9532007759456838,
"eval_overall_f1": 0.8031704095112285,
"eval_overall_precision": 0.7414634146341463,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3802,
"eval_samples_per_second": 491.892,
"eval_steps_per_second": 7.891,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.49151602387428284,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0807,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7515923566878981,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6413043478260869,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14267697930335999,
"eval_overall_accuracy": 0.9561105722599418,
"eval_overall_f1": 0.809078771695594,
"eval_overall_precision": 0.753731343283582,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3888,
"eval_samples_per_second": 481.006,
"eval_steps_per_second": 7.717,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.8003281354904175,
"learning_rate": 3.7e-05,
"loss": 0.0784,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7651006711409396,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6785714285714286,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8737864077669903,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.675,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.574468085106383,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15734340250492096,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8085106382978724,
"eval_overall_precision": 0.7506172839506173,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.758,
"eval_steps_per_second": 7.873,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.7769756317138672,
"learning_rate": 3.65e-05,
"loss": 0.0752,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7466666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7088607594936709,
"eval_LOCATION_recall": 0.7887323943661971,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6419753086419753,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5416666666666666,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15696412324905396,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.7973333333333333,
"eval_overall_precision": 0.7419354838709677,
"eval_overall_recall": 0.861671469740634,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.643,
"eval_steps_per_second": 7.871,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.2662298679351807,
"learning_rate": 3.6e-05,
"loss": 0.0747,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7346938775510203,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7105263157894737,
"eval_LOCATION_recall": 0.7605633802816901,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15037189424037933,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8113207547169812,
"eval_overall_precision": 0.7620253164556962,
"eval_overall_recall": 0.8674351585014409,
"eval_runtime": 0.3804,
"eval_samples_per_second": 491.554,
"eval_steps_per_second": 7.886,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.4553508162498474,
"learning_rate": 3.55e-05,
"loss": 0.073,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.7870967741935485,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7361963190184049,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6122448979591837,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1491299420595169,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8215223097112859,
"eval_overall_precision": 0.7542168674698795,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3799,
"eval_samples_per_second": 492.196,
"eval_steps_per_second": 7.896,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.8037567138671875,
"learning_rate": 3.5e-05,
"loss": 0.0722,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7393939393939394,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.61,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15461239218711853,
"eval_overall_accuracy": 0.9539282250242483,
"eval_overall_f1": 0.8178243774574051,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.39,
"eval_steps_per_second": 7.867,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.863256573677063,
"learning_rate": 3.45e-05,
"loss": 0.0691,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7368421052631579,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6436781609195402,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.9285714285714286,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9285714285714286,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1460384577512741,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.824631860776439,
"eval_overall_precision": 0.77,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.806,
"eval_steps_per_second": 7.874,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.5189836025238037,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0677,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.725,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6105263157894737,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1576639711856842,
"eval_overall_accuracy": 0.9546556741028128,
"eval_overall_f1": 0.8110236220472441,
"eval_overall_precision": 0.744578313253012,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3784,
"eval_samples_per_second": 494.206,
"eval_steps_per_second": 7.928,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.9570697546005249,
"learning_rate": 3.35e-05,
"loss": 0.0656,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7450980392156863,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6951219512195121,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7295597484276729,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6170212765957447,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.15803979337215424,
"eval_overall_accuracy": 0.9544131910766246,
"eval_overall_f1": 0.8078947368421052,
"eval_overall_precision": 0.7433414043583535,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.461,
"eval_steps_per_second": 7.868,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.5982742309570312,
"learning_rate": 3.3e-05,
"loss": 0.0665,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14798475801944733,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8178137651821863,
"eval_overall_precision": 0.7690355329949239,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3819,
"eval_samples_per_second": 489.71,
"eval_steps_per_second": 7.856,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.8073542714118958,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.063,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7080745341614907,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.59375,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16065409779548645,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8005249343832022,
"eval_overall_precision": 0.7349397590361446,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3816,
"eval_samples_per_second": 490.048,
"eval_steps_per_second": 7.862,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.0155664682388306,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0591,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7435897435897436,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6373626373626373,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16883772611618042,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8121693121693121,
"eval_overall_precision": 0.7506112469437652,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3804,
"eval_samples_per_second": 491.571,
"eval_steps_per_second": 7.886,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.546472430229187,
"learning_rate": 3.15e-05,
"loss": 0.0601,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7643312101910827,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7195121951219511,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5959595959595959,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6835443037974683,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5869565217391305,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1751433163881302,
"eval_overall_accuracy": 0.9515033947623667,
"eval_overall_f1": 0.8067444876783398,
"eval_overall_precision": 0.7334905660377359,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.234,
"eval_steps_per_second": 7.881,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.2387559413909912,
"learning_rate": 3.1e-05,
"loss": 0.0624,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.675,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.574468085106383,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16471463441848755,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8134228187919462,
"eval_overall_precision": 0.7613065326633166,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.693,
"eval_steps_per_second": 7.888,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 1.1353509426116943,
"learning_rate": 3.05e-05,
"loss": 0.0609,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15616856515407562,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.821954484605087,
"eval_overall_precision": 0.7675,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3789,
"eval_samples_per_second": 493.535,
"eval_steps_per_second": 7.918,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.9101806282997131,
"learning_rate": 3e-05,
"loss": 0.057,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7388535031847134,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6304347826086957,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1563103348016739,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8122503328894807,
"eval_overall_precision": 0.754950495049505,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3832,
"eval_samples_per_second": 488.013,
"eval_steps_per_second": 7.829,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.3714537024497986,
"learning_rate": 2.95e-05,
"loss": 0.0588,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7549668874172185,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7341772151898733,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6236559139784946,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16024786233901978,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8111702127659575,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.781,
"eval_steps_per_second": 7.89,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.28185874223709106,
"learning_rate": 2.9e-05,
"loss": 0.0537,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16531838476657867,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.8015873015873015,
"eval_overall_precision": 0.7408312958435208,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3794,
"eval_samples_per_second": 492.881,
"eval_steps_per_second": 7.907,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.7425450682640076,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0565,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6265060240963856,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.52,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.7878787878787878,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17831364274024963,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.7947712418300654,
"eval_overall_precision": 0.7272727272727273,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.483,
"eval_steps_per_second": 7.837,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.7398239374160767,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0564,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7662337662337663,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6629213483146067,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1617172211408615,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8155080213903744,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.678,
"eval_steps_per_second": 7.888,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.9621509313583374,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.053,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7891156462585034,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7073170731707317,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1658838987350464,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8150134048257373,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.542,
"eval_steps_per_second": 7.854,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.8231198787689209,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0503,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16653133928775787,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.824631860776439,
"eval_overall_precision": 0.77,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.088,
"eval_steps_per_second": 7.894,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.7595716118812561,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0513,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16581283509731293,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8225806451612904,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3809,
"eval_samples_per_second": 490.938,
"eval_steps_per_second": 7.876,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.855539858341217,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0501,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7581699346405228,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6590909090909091,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1663612574338913,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8122503328894807,
"eval_overall_precision": 0.754950495049505,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.649,
"eval_steps_per_second": 7.871,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 1.5128129720687866,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0497,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16162331402301788,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8197596795727637,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3826,
"eval_samples_per_second": 488.697,
"eval_steps_per_second": 7.84,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.2246452569961548,
"learning_rate": 2.5e-05,
"loss": 0.0478,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8681672025723473,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8385093167701864,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16639897227287292,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.809078771695594,
"eval_overall_precision": 0.753731343283582,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3797,
"eval_samples_per_second": 492.491,
"eval_steps_per_second": 7.901,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.46794039011001587,
"learning_rate": 2.45e-05,
"loss": 0.0481,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1614912897348404,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8164893617021276,
"eval_overall_precision": 0.7580246913580246,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3874,
"eval_samples_per_second": 482.673,
"eval_steps_per_second": 7.743,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.9891065359115601,
"learning_rate": 2.4e-05,
"loss": 0.0467,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17710401117801666,
"eval_overall_accuracy": 0.954898157129001,
"eval_overall_f1": 0.8078947368421052,
"eval_overall_precision": 0.7433414043583535,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.68,
"eval_steps_per_second": 7.888,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.105144739151001,
"learning_rate": 2.35e-05,
"loss": 0.0454,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17059719562530518,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8192771084337349,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3808,
"eval_samples_per_second": 491.088,
"eval_steps_per_second": 7.878,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.8647188544273376,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0423,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7972972972972974,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8653846153846153,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17431387305259705,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8161073825503355,
"eval_overall_precision": 0.7638190954773869,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.855,
"eval_steps_per_second": 7.875,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.8007002472877502,
"learning_rate": 2.25e-05,
"loss": 0.0454,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.172898069024086,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8225806451612904,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.135,
"eval_steps_per_second": 7.895,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.071050763130188,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0445,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.802721088435374,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7195121951219512,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16954554617404938,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.825268817204301,
"eval_overall_precision": 0.7732997481108312,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.727,
"eval_steps_per_second": 7.873,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.8882637619972229,
"learning_rate": 2.15e-05,
"loss": 0.0426,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7887323943661972,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18545663356781006,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8265582655826558,
"eval_overall_precision": 0.7800511508951407,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.172,
"eval_steps_per_second": 7.88,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.8679073452949524,
"learning_rate": 2.1e-05,
"loss": 0.0423,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7916666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7215189873417721,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17360354959964752,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8233695652173914,
"eval_overall_precision": 0.7789203084832905,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.858,
"eval_steps_per_second": 7.875,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 2.275029420852661,
"learning_rate": 2.05e-05,
"loss": 0.0431,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7972972972972974,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1791093796491623,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8247978436657682,
"eval_overall_precision": 0.7746835443037975,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3794,
"eval_samples_per_second": 492.887,
"eval_steps_per_second": 7.907,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 2.5058839321136475,
"learning_rate": 2e-05,
"loss": 0.0428,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7792207792207791,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6741573033707865,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8782051282051282,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17754900455474854,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.823529411764706,
"eval_overall_precision": 0.7680798004987531,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3808,
"eval_samples_per_second": 491.029,
"eval_steps_per_second": 7.877,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.7865079045295715,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0413,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7891156462585034,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7073170731707317,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16769103705883026,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8243243243243243,
"eval_overall_precision": 0.7760814249363868,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3783,
"eval_samples_per_second": 494.306,
"eval_steps_per_second": 7.93,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.5289219617843628,
"learning_rate": 1.9e-05,
"loss": 0.0398,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7354838709677419,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6333333333333333,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8745980707395499,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18425512313842773,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8100929614873836,
"eval_overall_precision": 0.7512315270935961,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.826,
"eval_steps_per_second": 7.874,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.5517676472663879,
"learning_rate": 1.85e-05,
"loss": 0.0375,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.76,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7329192546583851,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6145833333333334,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18431755900382996,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7457212713936431,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.495,
"eval_steps_per_second": 7.837,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.43984198570251465,
"learning_rate": 1.8e-05,
"loss": 0.0393,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1756104677915573,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.827027027027027,
"eval_overall_precision": 0.7786259541984732,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3797,
"eval_samples_per_second": 492.431,
"eval_steps_per_second": 7.9,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.6901776194572449,
"learning_rate": 1.75e-05,
"loss": 0.0381,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7397260273972603,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18173794448375702,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8203753351206434,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3821,
"eval_samples_per_second": 489.382,
"eval_steps_per_second": 7.851,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.4130526781082153,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0391,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7702702702702703,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7402597402597403,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1838272213935852,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8149134487350199,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3826,
"eval_samples_per_second": 488.807,
"eval_steps_per_second": 7.842,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.6909719109535217,
"learning_rate": 1.65e-05,
"loss": 0.0378,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7402597402597403,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6867469879518072,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7307692307692307,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6263736263736264,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.19103722274303436,
"eval_overall_accuracy": 0.9551406401551892,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7457212713936431,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3805,
"eval_samples_per_second": 491.5,
"eval_steps_per_second": 7.885,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.3753189742565155,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0385,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7919463087248322,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7023809523809523,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.870967741935484,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18312758207321167,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3806,
"eval_samples_per_second": 491.353,
"eval_steps_per_second": 7.883,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.2078567743301392,
"learning_rate": 1.55e-05,
"loss": 0.0382,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7515923566878981,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6413043478260869,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17568355798721313,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.048,
"eval_steps_per_second": 7.894,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.411945104598999,
"learning_rate": 1.5e-05,
"loss": 0.0363,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7972972972972974,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17883449792861938,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8274932614555257,
"eval_overall_precision": 0.7772151898734178,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3804,
"eval_samples_per_second": 491.549,
"eval_steps_per_second": 7.886,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.6801556348800659,
"learning_rate": 1.45e-05,
"loss": 0.0351,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7662337662337663,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6629213483146067,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18632389605045319,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8202396804260986,
"eval_overall_precision": 0.7623762376237624,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3814,
"eval_samples_per_second": 490.305,
"eval_steps_per_second": 7.866,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.6433190703392029,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0353,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7341772151898733,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6236559139784946,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8838709677419355,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18783344328403473,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7518427518427518,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.151,
"eval_steps_per_second": 7.879,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.3200623095035553,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0343,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7581699346405228,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6590909090909091,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.17813065648078918,
"eval_overall_accuracy": 0.9575654704170709,
"eval_overall_f1": 0.8198924731182795,
"eval_overall_precision": 0.7682619647355163,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.144,
"eval_steps_per_second": 7.895,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.39253032207489014,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0338,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7891156462585034,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7073170731707317,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18210819363594055,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.830393487109905,
"eval_overall_precision": 0.7846153846153846,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3797,
"eval_samples_per_second": 492.508,
"eval_steps_per_second": 7.901,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.9440187811851501,
"learning_rate": 1.25e-05,
"loss": 0.0338,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18501493334770203,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.82907133243607,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.709,
"eval_steps_per_second": 7.888,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.030535509809851646,
"learning_rate": 1.2e-05,
"loss": 0.0348,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8774193548387097,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18246251344680786,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8172043010752689,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3836,
"eval_samples_per_second": 487.539,
"eval_steps_per_second": 7.821,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.3823874294757843,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0349,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7916666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7215189873417721,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1836749166250229,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8288043478260869,
"eval_overall_precision": 0.7840616966580977,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.496,
"eval_steps_per_second": 7.837,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.7046309113502502,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0332,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18720394372940063,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8313090418353577,
"eval_overall_precision": 0.7817258883248731,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3838,
"eval_samples_per_second": 487.247,
"eval_steps_per_second": 7.817,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.7197487354278564,
"learning_rate": 1.05e-05,
"loss": 0.0348,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.181439608335495,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.830188679245283,
"eval_overall_precision": 0.779746835443038,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3799,
"eval_samples_per_second": 492.17,
"eval_steps_per_second": 7.896,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.49554863572120667,
"learning_rate": 1e-05,
"loss": 0.0327,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7814569536423841,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.686046511627907,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18670083582401276,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8322147651006712,
"eval_overall_precision": 0.7788944723618091,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3815,
"eval_samples_per_second": 490.142,
"eval_steps_per_second": 7.863,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.4919203817844391,
"learning_rate": 9.5e-06,
"loss": 0.0304,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7891156462585034,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7073170731707317,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.18983295559883118,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8313090418353577,
"eval_overall_precision": 0.7817258883248731,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.144,
"eval_steps_per_second": 7.895,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.3511189222335815,
"learning_rate": 9e-06,
"loss": 0.0311,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7763157894736842,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6781609195402298,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19013887643814087,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8284182305630027,
"eval_overall_precision": 0.7744360902255639,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3801,
"eval_samples_per_second": 491.997,
"eval_steps_per_second": 7.893,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.181095838546753,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0311,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6477272727272727,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.18673187494277954,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8176943699731903,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.728,
"eval_steps_per_second": 7.889,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.2343386560678482,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0311,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19123651087284088,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8247978436657682,
"eval_overall_precision": 0.7746835443037975,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3809,
"eval_samples_per_second": 490.888,
"eval_steps_per_second": 7.875,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.7187972664833069,
"learning_rate": 7.5e-06,
"loss": 0.0316,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7651006711409396,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6785714285714286,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19598372280597687,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.82907133243607,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3804,
"eval_samples_per_second": 491.562,
"eval_steps_per_second": 7.886,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.7457745671272278,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0302,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6551724137931034,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7105263157894738,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.627906976744186,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19160479307174683,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8257372654155496,
"eval_overall_precision": 0.7719298245614035,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3793,
"eval_samples_per_second": 493.05,
"eval_steps_per_second": 7.91,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.7893774509429932,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0302,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19260451197624207,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8310991957104558,
"eval_overall_precision": 0.7769423558897243,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3814,
"eval_samples_per_second": 490.309,
"eval_steps_per_second": 7.866,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.9674557447433472,
"learning_rate": 6e-06,
"loss": 0.0301,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19156460464000702,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.071,
"eval_steps_per_second": 7.894,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.4081524610519409,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0291,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8932038834951457,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1988055408000946,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.822429906542056,
"eval_overall_precision": 0.7661691542288557,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3814,
"eval_samples_per_second": 490.312,
"eval_steps_per_second": 7.866,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.2055195569992065,
"learning_rate": 5e-06,
"loss": 0.029,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19222281873226166,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3817,
"eval_samples_per_second": 489.931,
"eval_steps_per_second": 7.86,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.7582001686096191,
"learning_rate": 4.5e-06,
"loss": 0.0281,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19376523792743683,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.839,
"eval_steps_per_second": 7.874,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.382251501083374,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0293,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7549668874172185,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6551724137931034,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19469353556632996,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3841,
"eval_samples_per_second": 486.911,
"eval_steps_per_second": 7.811,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.3737156391143799,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0279,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6551724137931034,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1938970983028412,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8213333333333332,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3809,
"eval_samples_per_second": 490.922,
"eval_steps_per_second": 7.876,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.39239442348480225,
"learning_rate": 3e-06,
"loss": 0.0284,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7581699346405228,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7073170731707317,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19448162615299225,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.3812,
"eval_samples_per_second": 490.524,
"eval_steps_per_second": 7.869,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.2501358091831207,
"learning_rate": 2.5e-06,
"loss": 0.0277,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19271968305110931,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8263795423956932,
"eval_overall_precision": 0.7752525252525253,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.071,
"eval_steps_per_second": 7.894,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.3346474766731262,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0287,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7919463087248323,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19360853731632233,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.82907133243607,
"eval_overall_precision": 0.7777777777777778,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3831,
"eval_samples_per_second": 488.178,
"eval_steps_per_second": 7.832,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.5980328917503357,
"learning_rate": 1.5e-06,
"loss": 0.0295,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1938299536705017,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.819,
"eval_steps_per_second": 7.874,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.5382476449012756,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.028,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.19374345242977142,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3823,
"eval_samples_per_second": 489.131,
"eval_steps_per_second": 7.847,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.7957453727722168,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0288,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1937512904405594,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3822,
"eval_samples_per_second": 489.325,
"eval_steps_per_second": 7.85,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.36327624320983887,
"learning_rate": 0.0,
"loss": 0.0272,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7297297297297297,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1937185674905777,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8279569892473119,
"eval_overall_precision": 0.7758186397984886,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3796,
"eval_samples_per_second": 492.654,
"eval_steps_per_second": 7.904,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5123217774191952.0,
"train_loss": 0.07702873169251208,
"train_runtime": 615.3274,
"train_samples_per_second": 274.326,
"train_steps_per_second": 17.227
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5123217774191952.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}