nerugm-seq_bn-1 / trainer_state.json
apwic's picture
End of training
cace13f verified
raw
history blame contribute delete
No virus
144 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.289084553718567,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9293,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012738853503184716,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.25,
"eval_PERSON_recall": 0.006535947712418301,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.6359996199607849,
"eval_overall_accuracy": 0.8357691354966559,
"eval_overall_f1": 0.005698005698005698,
"eval_overall_precision": 0.2,
"eval_overall_recall": 0.002890173410404624,
"eval_runtime": 0.3296,
"eval_samples_per_second": 567.378,
"eval_steps_per_second": 9.102,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.5572154521942139,
"learning_rate": 4.9e-05,
"loss": 0.5712,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.22471910112359553,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.14492753623188406,
"eval_ORGANIZATION_f1": 0.046511627906976744,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.08,
"eval_ORGANIZATION_recall": 0.03278688524590164,
"eval_PERSON_f1": 0.45,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.4311377245508982,
"eval_PERSON_recall": 0.47058823529411764,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.5384615384615384,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.45161290322580644,
"eval_loss": 0.43386390805244446,
"eval_overall_accuracy": 0.8806044092147635,
"eval_overall_f1": 0.33851468048359246,
"eval_overall_precision": 0.4206008583690987,
"eval_overall_recall": 0.2832369942196532,
"eval_runtime": 0.3244,
"eval_samples_per_second": 576.457,
"eval_steps_per_second": 9.248,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.6938573122024536,
"learning_rate": 4.85e-05,
"loss": 0.4084,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.5405405405405406,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5063291139240507,
"eval_LOCATION_recall": 0.5797101449275363,
"eval_ORGANIZATION_f1": 0.29059829059829057,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.30357142857142855,
"eval_ORGANIZATION_recall": 0.2786885245901639,
"eval_PERSON_f1": 0.6467391304347827,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.5534883720930233,
"eval_PERSON_recall": 0.7777777777777778,
"eval_QUANTITY_f1": 0.22580645161290322,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.23333333333333334,
"eval_QUANTITY_recall": 0.21875,
"eval_TIME_f1": 0.6875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.7096774193548387,
"eval_loss": 0.3173196017742157,
"eval_overall_accuracy": 0.9165221699281645,
"eval_overall_f1": 0.5401844532279314,
"eval_overall_precision": 0.4963680387409201,
"eval_overall_recall": 0.5924855491329479,
"eval_runtime": 0.3294,
"eval_samples_per_second": 567.711,
"eval_steps_per_second": 9.108,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 3.1388819217681885,
"learning_rate": 4.8e-05,
"loss": 0.306,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.6143790849673202,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5595238095238095,
"eval_LOCATION_recall": 0.6811594202898551,
"eval_ORGANIZATION_f1": 0.4444444444444445,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.4642857142857143,
"eval_ORGANIZATION_recall": 0.4262295081967213,
"eval_PERSON_f1": 0.7669616519174042,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.6989247311827957,
"eval_PERSON_recall": 0.8496732026143791,
"eval_QUANTITY_f1": 0.6086956521739131,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.65625,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.22655707597732544,
"eval_overall_accuracy": 0.9370819915779044,
"eval_overall_f1": 0.672972972972973,
"eval_overall_precision": 0.631979695431472,
"eval_overall_recall": 0.7196531791907514,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.669,
"eval_steps_per_second": 9.011,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 2.1097211837768555,
"learning_rate": 4.75e-05,
"loss": 0.2369,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.6285714285714286,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5188679245283019,
"eval_LOCATION_recall": 0.7971014492753623,
"eval_ORGANIZATION_f1": 0.5442176870748299,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.46511627906976744,
"eval_ORGANIZATION_recall": 0.6557377049180327,
"eval_PERSON_f1": 0.7930029154518949,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7157894736842105,
"eval_PERSON_recall": 0.8888888888888888,
"eval_QUANTITY_f1": 0.5499999999999999,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.4583333333333333,
"eval_QUANTITY_recall": 0.6875,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.21178996562957764,
"eval_overall_accuracy": 0.9380728263562051,
"eval_overall_f1": 0.6897404202719406,
"eval_overall_precision": 0.6025917926565875,
"eval_overall_recall": 0.8063583815028902,
"eval_runtime": 0.3324,
"eval_samples_per_second": 562.65,
"eval_steps_per_second": 9.026,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.1763736009597778,
"learning_rate": 4.7e-05,
"loss": 0.1993,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7037037037037037,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6129032258064516,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6153846153846154,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5365853658536586,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.8195718654434252,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7701149425287356,
"eval_PERSON_recall": 0.8758169934640523,
"eval_QUANTITY_f1": 0.5753424657534246,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5121951219512195,
"eval_QUANTITY_recall": 0.65625,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17126347124576569,
"eval_overall_accuracy": 0.9482288828337875,
"eval_overall_f1": 0.7369791666666667,
"eval_overall_precision": 0.6706161137440758,
"eval_overall_recall": 0.8179190751445087,
"eval_runtime": 0.3356,
"eval_samples_per_second": 557.292,
"eval_steps_per_second": 8.941,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 1.0250859260559082,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1745,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7466666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.691358024691358,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.6122448979591837,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5232558139534884,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8385093167701864,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7988165680473372,
"eval_PERSON_recall": 0.8823529411764706,
"eval_QUANTITY_f1": 0.6216216216216217,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5476190476190477,
"eval_QUANTITY_recall": 0.71875,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15598997473716736,
"eval_overall_accuracy": 0.9512013871686896,
"eval_overall_f1": 0.7566137566137565,
"eval_overall_precision": 0.697560975609756,
"eval_overall_recall": 0.8265895953757225,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.394,
"eval_steps_per_second": 9.022,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.9757563471794128,
"learning_rate": 4.600000000000001e-05,
"loss": 0.158,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6344827586206897,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5476190476190477,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8411214953271029,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8035714285714286,
"eval_PERSON_recall": 0.8823529411764706,
"eval_QUANTITY_f1": 0.6301369863013699,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5609756097560976,
"eval_QUANTITY_recall": 0.71875,
"eval_TIME_f1": 0.7536231884057972,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15038101375102997,
"eval_overall_accuracy": 0.9521922219469904,
"eval_overall_f1": 0.7595269382391591,
"eval_overall_precision": 0.6963855421686747,
"eval_overall_recall": 0.8352601156069365,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.677,
"eval_steps_per_second": 9.155,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.060363531112671,
"learning_rate": 4.55e-05,
"loss": 0.1464,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6896551724137931,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6153846153846154,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5365853658536586,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.8490566037735848,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8181818181818182,
"eval_PERSON_recall": 0.8823529411764706,
"eval_QUANTITY_f1": 0.6666666666666665,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14481940865516663,
"eval_overall_accuracy": 0.9529353480307159,
"eval_overall_f1": 0.7655629139072848,
"eval_overall_precision": 0.706601466992665,
"eval_overall_recall": 0.8352601156069365,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.801,
"eval_steps_per_second": 9.013,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.9707283973693848,
"learning_rate": 4.5e-05,
"loss": 0.14,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.786206896551724,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6222222222222222,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5675675675675675,
"eval_ORGANIZATION_recall": 0.6885245901639344,
"eval_PERSON_f1": 0.8444444444444443,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8209876543209876,
"eval_PERSON_recall": 0.869281045751634,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13176114857196808,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.7770177838577291,
"eval_overall_precision": 0.7376623376623377,
"eval_overall_recall": 0.8208092485549133,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.689,
"eval_steps_per_second": 9.155,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.8272536396980286,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1336,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6259541984732824,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5857142857142857,
"eval_ORGANIZATION_recall": 0.6721311475409836,
"eval_PERSON_f1": 0.860759493670886,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.8888888888888888,
"eval_QUANTITY_f1": 0.6575342465753423,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13256430625915527,
"eval_overall_accuracy": 0.955907852365618,
"eval_overall_f1": 0.7735849056603774,
"eval_overall_precision": 0.7247474747474747,
"eval_overall_recall": 0.8294797687861272,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.93,
"eval_steps_per_second": 9.031,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 2.3991382122039795,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.126,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7894736842105263,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6616541353383459,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.8695652173913043,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8284023668639053,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.6486486486486486,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13229668140411377,
"eval_overall_accuracy": 0.9568986871439188,
"eval_overall_f1": 0.7887700534759359,
"eval_overall_precision": 0.7338308457711443,
"eval_overall_recall": 0.8526011560693642,
"eval_runtime": 0.3344,
"eval_samples_per_second": 559.23,
"eval_steps_per_second": 8.972,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.8172109723091125,
"learning_rate": 4.35e-05,
"loss": 0.1209,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6808510638297871,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8687500000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8323353293413174,
"eval_PERSON_recall": 0.9084967320261438,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12979264557361603,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8026845637583893,
"eval_overall_precision": 0.7493734335839599,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.3357,
"eval_samples_per_second": 557.123,
"eval_steps_per_second": 8.938,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.386945366859436,
"learning_rate": 4.3e-05,
"loss": 0.1172,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5698924731182796,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8650306748466258,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.815028901734104,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.6486486486486486,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.7536231884057972,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14491254091262817,
"eval_overall_accuracy": 0.9529353480307159,
"eval_overall_f1": 0.7839586028460543,
"eval_overall_precision": 0.7096018735362998,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3283,
"eval_samples_per_second": 569.521,
"eval_steps_per_second": 9.137,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.46282199025154114,
"learning_rate": 4.25e-05,
"loss": 0.1135,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8580441640378549,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8292682926829268,
"eval_PERSON_recall": 0.8888888888888888,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12623363733291626,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8032786885245903,
"eval_overall_precision": 0.7616580310880829,
"eval_overall_recall": 0.8497109826589595,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.012,
"eval_steps_per_second": 9.016,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.5779574513435364,
"learning_rate": 4.2e-05,
"loss": 0.1087,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8624999999999999,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1268586367368698,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8070175438596492,
"eval_overall_precision": 0.7569620253164557,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.612,
"eval_steps_per_second": 9.202,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.2563510537147522,
"learning_rate": 4.15e-05,
"loss": 0.1041,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8652037617554859,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.7027027027027026,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6190476190476191,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13557660579681396,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.8079999999999999,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.696,
"eval_steps_per_second": 9.011,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 2.330004930496216,
"learning_rate": 4.1e-05,
"loss": 0.102,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8643533123028391,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.8954248366013072,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.128007709980011,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.7994542974079127,
"eval_overall_precision": 0.7571059431524548,
"eval_overall_recall": 0.846820809248555,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.934,
"eval_steps_per_second": 9.031,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.4404404163360596,
"learning_rate": 4.05e-05,
"loss": 0.0999,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.6857142857142857,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12171030044555664,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8043478260869564,
"eval_overall_precision": 0.7589743589743589,
"eval_overall_recall": 0.8554913294797688,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.375,
"eval_steps_per_second": 9.182,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.6656851768493652,
"learning_rate": 4e-05,
"loss": 0.0942,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7894736842105263,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7391304347826089,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8757763975155279,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.834319526627219,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13243292272090912,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8100929614873839,
"eval_overall_precision": 0.7493857493857494,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.253,
"eval_steps_per_second": 9.02,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.6464937329292297,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0932,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7770700636942676,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6931818181818182,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7361111111111112,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8730650154798762,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8294117647058824,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.6944444444444444,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.7647058823529411,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7027027027027027,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14281630516052246,
"eval_overall_accuracy": 0.9564032697547684,
"eval_overall_f1": 0.8010471204188482,
"eval_overall_precision": 0.7320574162679426,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3327,
"eval_samples_per_second": 561.987,
"eval_steps_per_second": 9.016,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.1358213424682617,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0916,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8785046728971961,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8392857142857143,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.12807393074035645,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8200270635994588,
"eval_overall_precision": 0.7709923664122137,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.083,
"eval_steps_per_second": 9.017,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.7238495945930481,
"learning_rate": 3.85e-05,
"loss": 0.0892,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1260461062192917,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8216216216216216,
"eval_overall_precision": 0.7715736040609137,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.346,
"eval_steps_per_second": 9.022,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.773553490638733,
"learning_rate": 3.8e-05,
"loss": 0.0865,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6896551724137931,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7412587412587412,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7647058823529411,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7027027027027027,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14333529770374298,
"eval_overall_accuracy": 0.9578895219222194,
"eval_overall_f1": 0.8073878627968338,
"eval_overall_precision": 0.7427184466019418,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.546,
"eval_steps_per_second": 9.009,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.2657068967819214,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0834,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7746478873239437,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13225042819976807,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8246318607764391,
"eval_overall_precision": 0.7680798004987531,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3265,
"eval_samples_per_second": 572.661,
"eval_steps_per_second": 9.187,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 1.338986873626709,
"learning_rate": 3.7e-05,
"loss": 0.0823,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7638888888888888,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13243231177330017,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8273092369477911,
"eval_overall_precision": 0.770573566084788,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.332,
"eval_samples_per_second": 563.211,
"eval_steps_per_second": 9.035,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.9946244955062866,
"learning_rate": 3.65e-05,
"loss": 0.0809,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7391304347826089,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13205386698246002,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8216216216216216,
"eval_overall_precision": 0.7715736040609137,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.171,
"eval_steps_per_second": 9.179,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.337754487991333,
"learning_rate": 3.6e-05,
"loss": 0.0793,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1275886595249176,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.809782608695652,
"eval_overall_precision": 0.764102564102564,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.3333,
"eval_samples_per_second": 561.108,
"eval_steps_per_second": 9.002,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.4286695718765259,
"learning_rate": 3.55e-05,
"loss": 0.0759,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7428571428571428,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.880503144654088,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13053637742996216,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8205128205128205,
"eval_overall_precision": 0.769620253164557,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3332,
"eval_samples_per_second": 561.235,
"eval_steps_per_second": 9.004,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.020611047744751,
"learning_rate": 3.5e-05,
"loss": 0.0742,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7164179104477612,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.75,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13522376120090485,
"eval_overall_accuracy": 0.9596234827842457,
"eval_overall_f1": 0.8139223560910309,
"eval_overall_precision": 0.7581047381546134,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.963,
"eval_steps_per_second": 8.983,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.5647078156471252,
"learning_rate": 3.45e-05,
"loss": 0.0755,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8777429467084639,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8433734939759037,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12345639616250992,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8125000000000001,
"eval_overall_precision": 0.7666666666666667,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.599,
"eval_steps_per_second": 9.202,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.8619909286499023,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0709,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.126638263463974,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8209959623149394,
"eval_overall_precision": 0.7682619647355163,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.145,
"eval_steps_per_second": 9.179,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 3.400688886642456,
"learning_rate": 3.35e-05,
"loss": 0.0711,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.762589928057554,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6794871794871795,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.12633301317691803,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8272108843537415,
"eval_overall_precision": 0.781491002570694,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.79,
"eval_steps_per_second": 9.157,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.6063269376754761,
"learning_rate": 3.3e-05,
"loss": 0.0698,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13981756567955017,
"eval_overall_accuracy": 0.9591280653950953,
"eval_overall_f1": 0.8132450331125827,
"eval_overall_precision": 0.7506112469437652,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.139,
"eval_steps_per_second": 9.018,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 2.01218843460083,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0669,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6987951807228916,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7248322147651006,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6136363636363636,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.8895899053627759,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1391025334596634,
"eval_overall_accuracy": 0.958632648005945,
"eval_overall_f1": 0.8100929614873839,
"eval_overall_precision": 0.7493857493857494,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3328,
"eval_samples_per_second": 561.911,
"eval_steps_per_second": 9.015,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.48844727873802185,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0659,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7310344827586208,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8606060606060606,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13162988424301147,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8192771084337348,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3328,
"eval_samples_per_second": 561.896,
"eval_steps_per_second": 9.014,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.3096176385879517,
"learning_rate": 3.15e-05,
"loss": 0.0627,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7297297297297297,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.8895899053627759,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13473619520664215,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8186666666666668,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.531,
"eval_steps_per_second": 8.976,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.9041996598243713,
"learning_rate": 3.1e-05,
"loss": 0.0627,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7412587412587412,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13561618328094482,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8219544846050869,
"eval_overall_precision": 0.7655860349127181,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.038,
"eval_steps_per_second": 9.017,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.9759089350700378,
"learning_rate": 3.05e-05,
"loss": 0.0592,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7246376811594203,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6493506493506493,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.880503144654088,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1278260350227356,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8283378746594006,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.813,
"eval_steps_per_second": 9.013,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.8231136798858643,
"learning_rate": 3e-05,
"loss": 0.06,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7581699346405228,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6904761904761905,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.880503144654088,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13648688793182373,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8085676037483266,
"eval_overall_precision": 0.7531172069825436,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.148,
"eval_steps_per_second": 9.018,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.8856554627418518,
"learning_rate": 2.95e-05,
"loss": 0.0583,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7586206896551725,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.8819875776397514,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8402366863905325,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1364709734916687,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.822429906542056,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3319,
"eval_samples_per_second": 563.438,
"eval_steps_per_second": 9.039,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.7966371178627014,
"learning_rate": 2.9e-05,
"loss": 0.0592,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7482993197278911,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.896551724137931,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8614457831325302,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14667053520679474,
"eval_overall_accuracy": 0.9593757740896706,
"eval_overall_f1": 0.824468085106383,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.779,
"eval_steps_per_second": 9.157,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.6787899732589722,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0584,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14089816808700562,
"eval_overall_accuracy": 0.9591280653950953,
"eval_overall_f1": 0.8133333333333334,
"eval_overall_precision": 0.754950495049505,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3317,
"eval_samples_per_second": 563.793,
"eval_steps_per_second": 9.045,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.8825234174728394,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0571,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7361111111111112,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1371491551399231,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8209959623149394,
"eval_overall_precision": 0.7682619647355163,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3331,
"eval_samples_per_second": 561.467,
"eval_steps_per_second": 9.007,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.0761770009994507,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0568,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.75177304964539,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9084967320261438,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1322641521692276,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8310626702997275,
"eval_overall_precision": 0.7860824742268041,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.056,
"eval_steps_per_second": 9.017,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.5931002497673035,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0518,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7361111111111112,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7142857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14024412631988525,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8165997322623829,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.842,
"eval_steps_per_second": 8.997,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.7838124632835388,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0529,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7310344827586208,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1365956962108612,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8172043010752688,
"eval_overall_precision": 0.7638190954773869,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.284,
"eval_steps_per_second": 9.021,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.4798297882080078,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0516,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7153284671532848,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6447368421052632,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.880503144654088,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14157778024673462,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8167115902964959,
"eval_overall_precision": 0.7651515151515151,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3333,
"eval_samples_per_second": 561.042,
"eval_steps_per_second": 9.001,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.9078386425971985,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0524,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7285714285714285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6455696202531646,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8606060606060606,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14155249297618866,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8286099865047234,
"eval_overall_precision": 0.7772151898734178,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3319,
"eval_samples_per_second": 563.426,
"eval_steps_per_second": 9.039,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.6509796380996704,
"learning_rate": 2.5e-05,
"loss": 0.0494,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1381203830242157,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8254397834912043,
"eval_overall_precision": 0.7760814249363868,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3345,
"eval_samples_per_second": 559.02,
"eval_steps_per_second": 8.968,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.7626707553863525,
"learning_rate": 2.45e-05,
"loss": 0.0478,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7297297297297297,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14348609745502472,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8310991957104559,
"eval_overall_precision": 0.775,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3315,
"eval_samples_per_second": 564.037,
"eval_steps_per_second": 9.049,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.5748308300971985,
"learning_rate": 2.4e-05,
"loss": 0.0485,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14024515450000763,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.836021505376344,
"eval_overall_precision": 0.7814070351758794,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3324,
"eval_samples_per_second": 562.57,
"eval_steps_per_second": 9.025,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.001908779144287,
"learning_rate": 2.35e-05,
"loss": 0.0475,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13823822140693665,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8313090418353577,
"eval_overall_precision": 0.779746835443038,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.779,
"eval_steps_per_second": 8.996,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.5605162382125854,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0481,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7285714285714285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6455696202531646,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14209988713264465,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8209959623149394,
"eval_overall_precision": 0.7682619647355163,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.696,
"eval_steps_per_second": 9.011,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 1.0782426595687866,
"learning_rate": 2.25e-05,
"loss": 0.0474,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.8909657320872275,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8511904761904762,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14407247304916382,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8346666666666667,
"eval_overall_precision": 0.7747524752475248,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3328,
"eval_samples_per_second": 561.974,
"eval_steps_per_second": 9.016,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 2.055668592453003,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0456,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7153284671532848,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6447368421052632,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8606060606060606,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14129342138767242,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8183041722745625,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.981,
"eval_steps_per_second": 9.032,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.7829787135124207,
"learning_rate": 2.15e-05,
"loss": 0.0451,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7428571428571428,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.89375,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8562874251497006,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14520226418972015,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7719298245614035,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3271,
"eval_samples_per_second": 571.771,
"eval_steps_per_second": 9.173,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.2567724287509918,
"learning_rate": 2.1e-05,
"loss": 0.0437,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6265060240963856,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8958990536277602,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8658536585365854,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14597974717617035,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8219544846050869,
"eval_overall_precision": 0.7655860349127181,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3323,
"eval_samples_per_second": 562.69,
"eval_steps_per_second": 9.027,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.4437527656555176,
"learning_rate": 2.05e-05,
"loss": 0.0424,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1500689834356308,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8186666666666668,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3324,
"eval_samples_per_second": 562.659,
"eval_steps_per_second": 9.027,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.7316974997520447,
"learning_rate": 2e-05,
"loss": 0.0423,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8847352024922119,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8452380952380952,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15397267043590546,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7549019607843137,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3265,
"eval_samples_per_second": 572.825,
"eval_steps_per_second": 9.19,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.7264176607131958,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.041,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.147948756814003,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8208556149732621,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.648,
"eval_steps_per_second": 8.994,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.7140088677406311,
"learning_rate": 1.9e-05,
"loss": 0.0405,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8847352024922119,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8452380952380952,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.148734450340271,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8150134048257373,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.598,
"eval_steps_per_second": 9.01,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 1.8145302534103394,
"learning_rate": 1.85e-05,
"loss": 0.0394,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.8902821316614421,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8554216867469879,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14801925420761108,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8241610738255033,
"eval_overall_precision": 0.7694235588972431,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.37,
"eval_steps_per_second": 9.022,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.2566087245941162,
"learning_rate": 1.8e-05,
"loss": 0.0384,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.627906976744186,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.89375,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8562874251497006,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15676021575927734,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.824468085106383,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.621,
"eval_steps_per_second": 9.01,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.431575894355774,
"learning_rate": 1.75e-05,
"loss": 0.0397,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6993006993006993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8785046728971961,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8392857142857143,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14874185621738434,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8170894526034712,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3264,
"eval_samples_per_second": 572.977,
"eval_steps_per_second": 9.192,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.1114250421524048,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0388,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7074829931972788,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6046511627906976,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8916408668730651,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8470588235294118,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1624731570482254,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8153034300791557,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3323,
"eval_samples_per_second": 562.754,
"eval_steps_per_second": 9.028,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 2.434706926345825,
"learning_rate": 1.65e-05,
"loss": 0.0402,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7123287671232876,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.611764705882353,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8909657320872275,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8511904761904762,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1620258390903473,
"eval_overall_accuracy": 0.9596234827842457,
"eval_overall_f1": 0.8201058201058201,
"eval_overall_precision": 0.7560975609756098,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.349,
"eval_steps_per_second": 9.022,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.43614867329597473,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0397,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7183098591549297,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6296296296296297,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1530744731426239,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8155080213903744,
"eval_overall_precision": 0.7587064676616916,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.328,
"eval_samples_per_second": 570.186,
"eval_steps_per_second": 9.147,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.2761048078536987,
"learning_rate": 1.55e-05,
"loss": 0.0383,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7034482758620689,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6071428571428571,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8847352024922119,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8452380952380952,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15172313153743744,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8219544846050869,
"eval_overall_precision": 0.7655860349127181,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3319,
"eval_samples_per_second": 563.458,
"eval_steps_per_second": 9.039,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.8664883375167847,
"learning_rate": 1.5e-05,
"loss": 0.0375,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1547580361366272,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8208556149732621,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3256,
"eval_samples_per_second": 574.274,
"eval_steps_per_second": 9.213,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.3128960132598877,
"learning_rate": 1.45e-05,
"loss": 0.0368,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.689655172413793,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5952380952380952,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15528355538845062,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8117489986648866,
"eval_overall_precision": 0.7543424317617866,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.889,
"eval_steps_per_second": 9.03,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 2.342613458633423,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0375,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15482325851917267,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8150134048257373,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.879,
"eval_steps_per_second": 9.03,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 2.5355284214019775,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0364,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6950354609929078,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6125,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15112702548503876,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.811320754716981,
"eval_overall_precision": 0.76010101010101,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.3265,
"eval_samples_per_second": 572.81,
"eval_steps_per_second": 9.189,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 2.763317108154297,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0356,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6944444444444445,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6024096385542169,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15702202916145325,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8128342245989304,
"eval_overall_precision": 0.7562189054726368,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.361,
"eval_steps_per_second": 9.022,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.9147346615791321,
"learning_rate": 1.25e-05,
"loss": 0.0345,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7132867132867133,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6219512195121951,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.160079225897789,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8192771084337348,
"eval_overall_precision": 0.7630922693266833,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3259,
"eval_samples_per_second": 573.758,
"eval_steps_per_second": 9.205,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.9755911827087402,
"learning_rate": 1.2e-05,
"loss": 0.0358,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15988942980766296,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.816,
"eval_overall_precision": 0.7574257425742574,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.905,
"eval_steps_per_second": 9.031,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.6485092639923096,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0359,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15627126395702362,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8236877523553163,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.64,
"eval_steps_per_second": 9.01,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.8235780596733093,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0328,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7050359712230215,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6282051282051282,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15545301139354706,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8216216216216216,
"eval_overall_precision": 0.7715736040609137,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.819,
"eval_steps_per_second": 9.158,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.297727108001709,
"learning_rate": 1.05e-05,
"loss": 0.034,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7183098591549297,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6296296296296297,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1584213823080063,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3318,
"eval_samples_per_second": 563.58,
"eval_steps_per_second": 9.041,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 1.0464829206466675,
"learning_rate": 1e-05,
"loss": 0.0344,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15635241568088531,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8216216216216216,
"eval_overall_precision": 0.7715736040609137,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.931,
"eval_steps_per_second": 8.999,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 1.1984474658966064,
"learning_rate": 9.5e-06,
"loss": 0.0337,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6950354609929078,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6125,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16573630273342133,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8150134048257373,
"eval_overall_precision": 0.76,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.721,
"eval_steps_per_second": 8.996,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.3891063928604126,
"learning_rate": 9e-06,
"loss": 0.0331,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6986301369863014,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16680771112442017,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8186666666666668,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.602,
"eval_steps_per_second": 9.202,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.0325218439102173,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0328,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.880503144654088,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15955756604671478,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8167115902964959,
"eval_overall_precision": 0.7651515151515151,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.469,
"eval_steps_per_second": 9.024,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.833433747291565,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0339,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.723404255319149,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6375,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15904375910758972,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8183041722745625,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.206,
"eval_steps_per_second": 9.019,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.8579007983207703,
"learning_rate": 7.5e-06,
"loss": 0.0324,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6906474820143885,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8742138364779874,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9084967320261438,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15392935276031494,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8092016238159675,
"eval_overall_precision": 0.7608142493638677,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.3321,
"eval_samples_per_second": 563.068,
"eval_steps_per_second": 9.033,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 2.3941845893859863,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0327,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6762589928057554,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6025641025641025,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.875,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1588955819606781,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8053691275167784,
"eval_overall_precision": 0.7518796992481203,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3263,
"eval_samples_per_second": 573.03,
"eval_steps_per_second": 9.193,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.8358588218688965,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0318,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.723404255319149,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6375,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16152726113796234,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8198924731182795,
"eval_overall_precision": 0.7663316582914573,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3317,
"eval_samples_per_second": 563.682,
"eval_steps_per_second": 9.043,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 2.0525128841400146,
"learning_rate": 6e-06,
"loss": 0.0311,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6906474820143885,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16066040098667145,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8129205921938087,
"eval_overall_precision": 0.760705289672544,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3324,
"eval_samples_per_second": 562.545,
"eval_steps_per_second": 9.025,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.892722487449646,
"learning_rate": 5.500000000000001e-06,
"loss": 0.033,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6233766233766234,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16328519582748413,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8118279569892471,
"eval_overall_precision": 0.7587939698492462,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3318,
"eval_samples_per_second": 563.6,
"eval_steps_per_second": 9.042,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.3466918468475342,
"learning_rate": 5e-06,
"loss": 0.0314,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1654297560453415,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8183041722745625,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3339,
"eval_samples_per_second": 560.083,
"eval_steps_per_second": 8.985,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.5831097960472107,
"learning_rate": 4.5e-06,
"loss": 0.0317,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16038751602172852,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8145161290322581,
"eval_overall_precision": 0.7613065326633166,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3258,
"eval_samples_per_second": 573.92,
"eval_steps_per_second": 9.207,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 2.8795530796051025,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0313,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16018863022327423,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8156123822341858,
"eval_overall_precision": 0.7632241813602015,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.323,
"eval_steps_per_second": 9.021,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.9272975325584412,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0317,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16194607317447662,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8183041722745625,
"eval_overall_precision": 0.7657430730478589,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3339,
"eval_samples_per_second": 560.094,
"eval_steps_per_second": 8.985,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.6155447959899902,
"learning_rate": 3e-06,
"loss": 0.0322,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16590212285518646,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8203753351206433,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.332,
"eval_samples_per_second": 563.263,
"eval_steps_per_second": 9.036,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.8714067339897156,
"learning_rate": 2.5e-06,
"loss": 0.0305,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6993006993006993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16414810717105865,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8128342245989304,
"eval_overall_precision": 0.7562189054726368,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3262,
"eval_samples_per_second": 573.227,
"eval_steps_per_second": 9.196,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.7234588265419006,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0302,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7050359712230215,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6282051282051282,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1619059145450592,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8167115902964959,
"eval_overall_precision": 0.7651515151515151,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3323,
"eval_samples_per_second": 562.669,
"eval_steps_per_second": 9.027,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 1.2419594526290894,
"learning_rate": 1.5e-06,
"loss": 0.0309,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7183098591549297,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6296296296296297,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1639154851436615,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.252,
"eval_steps_per_second": 9.02,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.3145425021648407,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0288,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6993006993006993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16421489417552948,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8139223560910309,
"eval_overall_precision": 0.7581047381546134,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.38,
"eval_steps_per_second": 9.022,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.6178627610206604,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0307,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6901408450704226,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6049382716049383,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1645815670490265,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8112449799196787,
"eval_overall_precision": 0.7556109725685786,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.332,
"eval_samples_per_second": 563.213,
"eval_steps_per_second": 9.036,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 1.0940686464309692,
"learning_rate": 0.0,
"loss": 0.032,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6993006993006993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8840125391849529,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1641756296157837,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8128342245989304,
"eval_overall_precision": 0.7562189054726368,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.318,
"eval_steps_per_second": 9.021,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4608467078884878.0,
"train_loss": 0.08280598743906561,
"train_runtime": 623.2047,
"train_samples_per_second": 270.698,
"train_steps_per_second": 17.009
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4608467078884878.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}